Load libraries and public variables
# File that contains simulation output data in a HDF5 directory structure specified in "/publicVariables/createPublicVariables.Rmd"
simOutputH5 <- paste0("../../dataProcessing/simOutputH5Data/", experimentID, "_output.h5")
# A comprehensive table that contains all simulation input and calculated output metrics
allSimInputOutput <- read_feather("../allSimInputOutput.feather")
# This folder contains raw output files from the simulations. This is needed for calculate_para_sp_mcpsr()
rawSimOutFolder <- "/team/batch_SMOTNT/experiment1_output"
# Where figures are stored
figureBaseFolder <- "../figures/"
Validation: compare the protein synthesis rates with Weinberg 2016
weinbergData <- read_tsv("../externalData/weinberg_synthesis.txt")
Rows: 4839 Columns: 16
── Column specification ───────────────────────────────────────────────────────────────────────────────────────────────────────────────────
Delimiter: "\t"
chr (1): ORF
dbl (15): Length, RPF, mRNA, TE, IP, FEatg, FEcap, cRPF, cTE, uATG, utr, gc, pE, Ai, S
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
validationPlot <- allSimInputOutput %>%
filter(paraCombo == "mRNAconstant") %>%
select(ORF, paraCombo, MPSR, dc, r) %>%
left_join(weinbergData[, c("ORF", "S")], by = "ORF") %>%
mutate(S_perMin=S*60,
newcombo=factor(paraCombo, levels=dc.r.df$paraCombo[2:25])) %>%
ggplot(aes(x=MPSR, y=S_perMin)) +
geom_abline(linetype="dashed") +
geom_point() +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.7, size=10) +
scale_x_log10() +
scale_y_log10() +
theme_bw() +
labs(x="Mean protein synthesis rates for mRNA constant",
y="Protein synthesis rate estimates by Weinberg et al 2016")
validationPlot
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 123 rows containing non-finite values (stat_smooth).
Warning: Removed 123 rows containing non-finite values (stat_cor).
Warning: Removed 123 rows containing missing values (geom_point).

write_rds(validationPlot, "../figures/validationPlot.rds")
tmp <- allSimInputOutput %>%
filter(paraCombo == "mRNAconstant") %>%
select(ORF, paraCombo, MPSR) %>%
left_join(weinbergData[, c("ORF", "S")], by = "ORF") %>%
mutate(S_perMin=S*60)
# quick try of piping the t test didn't work..
t.test(tmp$S_perMin, tmp$MPSR, paired = TRUE)
Paired t-test
data: tmp$S_perMin and tmp$MPSR
t = 2.7885, df = 4715, p-value = 0.005317
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
0.7112053 4.0789951
sample estimates:
mean of the differences
2.3951
figS0_a <- allSimInputOutput %>%
filter(paraCombo=="mRNAconstant"|paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
ggplot(aes(x=MPSR, y=PMPSR, color = paraCombo)) +
geom_point(size = 0.5) +
geom_abline(linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Mean of protein synthesis rate'~(min^-1),
y = 'Predicted mean of protein synthesis rate'~(min^-1)) +
scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10() +
scale_y_log10()
figS0_a
`geom_smooth()` using formula 'y ~ x'

write_rds(figS0_a,"../figures/figS0_a.rds")
######################################################
figS0_b <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, MVPS, PMPSR, mRNASynRateTotal_sec) %>%
mutate(mRNASynRateTotal_min = mRNASynRateTotal_sec*60,
additiveVar = PMPSR + mRNASynRateTotal_min,
multiplicativeVar = PMPSR * mRNASynRateTotal_min + PMPSR^2*mRNASynRateTotal_min + PMPSR*mRNASynRateTotal_min^2) %>%
select(ORF, MVPS, additiveVar, multiplicativeVar) %>%
pivot_longer(names_to = "predictedVar", values_to = "predictedVarValue", cols = -c(ORF,MVPS)) %>%
ggplot(aes(x=MVPS, y=predictedVarValue, color = predictedVar)) +
geom_point(size = 0.5) +
geom_abline(linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Variance of protein synthesis rate'~(min^-1),
y = 'Predicted variance of protein synthesis rate'~(min^-1)) +
scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10() +
scale_y_log10()
figS0_b
Warning: Transformation introduced infinite values in continuous y-axis
Warning: Transformation introduced infinite values in continuous y-axis
Warning: Transformation introduced infinite values in continuous y-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 31 rows containing non-finite values (stat_smooth).
Warning: Removed 31 rows containing non-finite values (stat_cor).

write_rds(figS0_b, "../figures/figS0_b.rds")
######################################################
figS0_c <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, MPSR, RMPSR) %>%
ggplot(aes(x = MPSR, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'mean prot syn rate for mRNAvarying'~(min^-1),
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10()
figS0_c
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'

write_rds(figS0_c, "../figures/figS0_c.rds")
######################################################
figS0_d <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, MPSR, RMPSR) %>%
arrange(MPSR) %>%
# mutate(binNames = c(unlist(lapply(1:19, function(x){rep(x,254)})), rep(20,12))) %>% # bin all 4838 genes into 20 bins, each contains same number of genes ordered by their MPSR
# ggplot(aes(x = factor(binNames, levels = 1:20), y = RMPSR)) +
mutate(binNames = c(unlist(lapply(1:9, function(x){rep(x,537)})), rep(10,5))) %>% # bin all 4838 genes into 10 bins, each contains same number of genes ordered by their MPSR
ggplot(aes(x = factor(binNames, levels = 1:10), y = RMPSR)) +
geom_boxplot() +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'mean prot syn rate for mRNAvarying'~(min^-1),
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5)
figS0_d
`geom_smooth()` using method = 'loess' and formula 'y ~ x'

write_rds(figS0_d, "../figures/figS0_d.rds")
######################################################
figS0_e <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, MPSR, RMPSR) %>%
arrange(MPSR) %>%
# mutate(binNames = c(unlist(lapply(1:19, function(x){rep(x,254)})), rep(20,12))) %>% # bin all 4838 genes into 20 bins, each contains same number of genes ordered by their MPSR
# ggplot(aes(x = factor(binNames, levels = 1:20), y = RMPSR)) +
mutate(binNames = c(unlist(lapply(1:9, function(x){rep(x,537)})), rep(10,5))) %>% # bin all 4838 genes into 10 bins, each contains same number of genes ordered by their MPSR
group_by(binNames) %>%
mutate(test = RMPSR>1) %>%
#mutate(freqRMPSRabove1 = sum(test)/n()) %>%
summarize(freqRMPSRabove1 = sum(test)/n()) %>%
ggplot(aes(x = factor(binNames, levels = 1:10), y = freqRMPSRabove1)) +
geom_bar(stat='identity') +
#geom_abline(linetype="dashed") +
#geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'bins of genes',
y = 'freq of rel. mean prot syn rate above 1 in each bin')
figS0_e

write_rds(figS0_e, "../figures/figS0_e.rds")
######################################################
figS0_f <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, mRNAabundance, RMPSR) %>%
ggplot(aes(x = mRNAabundance, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'mRNA abundances',
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10()
figS0_f
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'

write_rds(figS0_f, "../figures/figS0_f.rds")
######################################################
figS0_g <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, CAI, RMPSR) %>%
ggplot(aes(x = CAI, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'CAI',
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5)
figS0_g
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'

write_rds(figS0_g, "../figures/figS0_g.rds")
######################################################
figS0_h <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, iniProb, RMPSR) %>%
ggplot(aes(x = iniProb, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'translation initiation probability',
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10()
figS0_h
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'

write_rds(figS0_h, "../figures/figS0_h.rds")
######################################################
figS0_i <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
#mutate(intCtrlOrNot = ifelse(mRNADecRateNeymotin_sec==0,"intCtrl","nonCtrl")) %>%
#select(paraCombo, ORF, geneLength_codon, RMPSR, intCtrlOrNot) %>%
select(paraCombo, ORF, geneLength_codon, RMPSR) %>%
#ggplot(aes(x = geneLength_codon, y = RMPSR, color = intCtrlOrNot)) +
ggplot(aes(x = geneLength_codon, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'gene length (codon)',
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10()
figS0_i
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'

write_rds(figS0_i, "../figures/figS0_i.rds")
######################################################
figS0_j <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
select(paraCombo, ORF, mRNADecRateNeymotin_min, RMPSR) %>%
ggplot(aes(x = mRNADecRateNeymotin_min, y = RMPSR)) +
geom_point(size = 0.5) +
#geom_abline(linetype="dashed") +
geom_hline(yintercept = 1, linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "top",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'mRNA decay rates from Neymotin data (min)',
y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
#scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
geom_smooth() +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
scale_x_log10()
figS0_j
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using method = 'gam' and formula 'y ~ s(x, bs = "cs")'
Warning: Removed 31 rows containing non-finite values (stat_smooth).
Warning: Removed 31 rows containing non-finite values (stat_cor).

write_rds(figS0_j, "../figures/figS0_j.rds")
######################################################
figS0_k <- allSimInputOutput %>%
filter(paraCombo!= "mRNAconstant") %>%
select(dc, r, RMFR) %>%
unique() %>%
ggplot(aes(x = dc, y = RMFR, color = factor(r))) +
geom_point() +
geom_line() +
# theme_bw() +
# theme(text = element_text(size = 13),
# legend.position = "top",
# strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
# plot.margin = margin(r = 0, unit = "pt"),
# panel.grid = element_blank()
# ) +
labs(x = 'CMD levels',
y = 'Relative mean free ribosomes') +
scale_color_discrete(name = "Ribo protection index")
figS0_k
geom_path: Each group consists of only one observation. Do you need to adjust the group aesthetic?

write_rds(figS0_k, "../figures/figS0_k.rds")
######################################################
figS0_l <- allSimInputOutput %>%
filter(paraCombo=="dc_0_r_1", ORF!="YER053C-A") %>% #remove the gene with the 450min HL
# filter(paraCombo=="dc_0_r_1", ORF!="YER053C-A", mRNADecRateNeymotin_sec==0) %>%
# select("ORF", "RMPSR", "RMFR") %>%
mutate(intCtrlOrNot = ifelse(mRNADecRateNeymotin_sec==0,"intCtrl","nonCtrl")) %>%
select("ORF", "RMPSR", "intCtrlOrNot") %>%
#select("ORF", "RMPSR") %>%
ggplot() +
geom_density(aes(x=RMPSR, color = intCtrlOrNot)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = c(0.6, 0.6),
legend.background = element_blank(),
axis.ticks.y = element_blank(),
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()) +
labs(x = "Rel. mean protein synthesis rate") +
#scale_color_manual(values = c("RMVPS"="black")) +
scale_color_manual(values = c("intCtrl"="blue", "nonCtrl"="black")) +
scale_x_log10() +
geom_vline(xintercept = 1, linetype = "dashed")
figS0_l

write_rds(figS0_l, "../figures/figS0_l.rds")
Fig S1
trial_mRNAcount <- read_feather("../../simulations/trialmRNAcountData/trial_mRNAcount.feather")
trial_mRNAcount
figureS1 <- allSimInputOutput %>%
left_join(., trial_mRNAcount[,c("paraCombo","ORF","trialRMMC")], by = c("paraCombo"="paraCombo", "ORF"="ORF")) %>%
filter(paraCombo != "mRNAconstant") %>%
select(paraCombo, RMMC, trialRMMC, dc, r) %>%
`colnames<-`(c("paraCombo", "AfterScaling", "BeforeScaling", "dc", "r")) %>%
pivot_longer(names_to = "key", values_to = "RMMCvalue", cols = 2:3) %>%
ggplot(aes(x=RMMCvalue, color=key)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(title = "Fig S1: mRNA counts when varying are laregely equal to when they are constant \nafter scaling the mRNA synthesis rates",
x="Relative mean mRNA count") +
scale_y_continuous() +
theme_bw() +
theme(text=element_text(size=13),
legend.title = element_blank(),
legend.position = "bottom")
figureS1

write_rds(figureS1, "../figures/figureS1.rds")
#ggsave(paste0(figureBaseFolder, "figures1/s_fig_1.png"), dpi=100, height = 6, width = 8)
###########################################################
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant") %>%
select(paraCombo, RMMC, dc, r) %>%
ggplot(aes(x = RMMC)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(x="Relative mean mRNA count after scaling") +
scale_y_continuous() +
theme_bw() +
theme(text=element_text(size=13),
legend.title = element_blank(),
legend.position = "none") +
geom_vline(xintercept = 1, linetype = "dashed")

###########################################################
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant") %>%
select(paraCombo, RMMC, dc, r, geneLength_codon) %>%
mutate(sORl = ifelse(geneLength_codon >=512, "long", "short")) %>%
ggplot(aes(x=RMMC, color=sORl)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(x="Relative mean mRNA count") +
scale_y_continuous() +
theme_bw() +
theme(legend.title = element_blank(),
legend.position = "bottom",
strip.text.x = element_text(size=10),
strip.text.y = element_text(size=10))

###########################################################
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant") %>%
select(paraCombo, RMMC, dc, r, mRNADecRateNeymotin_sec) %>%
mutate(fORs = ifelse(mRNADecRateNeymotin_sec >=0.0009431628, "fast", "slow")) %>%
ggplot(aes(x=RMMC, color=fORs)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(x="Relative mean mRNA count") +
scale_y_continuous() +
theme_bw() +
theme(legend.title = element_blank(),
legend.position = "bottom",
strip.text.x = element_text(size=10),
strip.text.y = element_text(size=10))

allSimInputOutput%>%
filter(ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0, paraCombo!="mRNAconstant") %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
ggplot(aes(x=dc_fct, y=RMMC, fill=r)) +
geom_boxplot(outlier.size = 0.1) +
# geom_hline(aes(yintercept=median(as.numeric(unlist(allSimInputOutput%>%filter(ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0, paraCombo=="dc_1_r_0")%>%select(RMMDR))), na.rm = TRUE)), color="red", linetype="dashed") +
theme_bw() +
labs(x="CMD level",
y="Relative mean mRNA count") +
scale_x_discrete(labels=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0")) +
scale_fill_discrete(name = "Ribosome\nprot index") +
theme(
text = element_text(size = 13),
legend.position = "none"
)

allSimInputOutput %>%
group_by(paraCombo) %>%
summarise(M = mean(RMMC)) %>%
arrange(desc(M))
allSimInputOutput %>%
group_by(dc) %>%
summarise(M = mean(RMMC)) %>%
arrange(desc(M))
NA
Fig. was S3, now S2
figureS2 <- allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", ORF != "YER053C-A", mRNADecRateNeymotin_sec != 0) %>%
ggplot(aes(x = MMC, y = MVMC)) +
geom_point(size = 0.5) +
geom_abline(linetype = "dashed") +
facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx = 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Mean of mRNA count',
y = 'Variance of mRNA count') +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size = 5) +
scale_x_log10() +
scale_y_log10()
figureS2
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS2, "../figures/figureS2.rds")
was Fig S4, now S3: Sequence features correlate with the fano factor of protein synthesis rates for mRNA constant
plot_fun1 <- function(var1, var2){ allSimInputOutput%>% #var1:"MeanProteinSynRate".. var2:"mRNAconstant", "dc_1_r_0"
filter(paraCombo == var2, mRNADecRateNeymotin_sec != 0) %>%
select(ORF, MPSR, MVPS, iniProb_log10, mRNAabundance_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
mutate(fano_protSyn = MVPS/MPSR) %>%
filter(fano_protSyn>0.3) %>% # filter out the two outliers
`colnames<-`(paste0("",c("ORF", "MeanProteinSynRate", "VarianceProteinSynRate", "iniProb_log10", "mRNALevel_log10", "DecRate_log10", "CAI", "geneLength_log10", "fano_protSynRate"))) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !c(ORF,MeanProteinSynRate, VarianceProteinSynRate, fano_protSynRate)) %>%
ggplot(aes_string(x = "featureVals", y = var1)) +
geom_point(size = 0.5) +
facet_wrap(~feature, scales = "free", nrow = 1, strip.position = "bottom") +
theme_bw() +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.4, label.y.npc = 0.13, size = 3) +
labs(x = "",
y = var1) +
scale_y_log10() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside" #to put the strip labels below x-axis
)
}
figureS3 <- plot_fun1("fano_protSynRate", "mRNAconstant")
figureS3
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS3, "../figures/figureS3.rds")
Was Fig S5, now S4.
# MMDP = mRNAs marked for degradation proportion among mean total mRNA
figureS4 <- allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0) %>%
ggplot(aes(x = MMDP, y = RMPSR)) +
geom_point(size = 0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x = "Proportion of mRNA marked for decay",
y = "Relative mean of protein synthesis rates",
title = "") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.1, label.y.npc = 0.3, size = 3) +
theme_bw() +
theme(text=element_text(size = 13))
figureS4
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS4, "../figures/figureS4.rds")
Fig. S5
figureS5 <- allSimInputOutput %>%
filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0) %>%
select("ORF", "CVPS", "CVMC", "paraCombo") %>% #remove the gene with the 450min HL
ggplot(aes(x=CVMC, y=CVPS, colour=paraCombo)) +
geom_point(size = 0.5) +
geom_abline(linetype="dashed") +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
strip.text = element_text(color="white"), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x ="CV for mRNA count per min",
y = "CV for protein synthesis rate") +
#scale_color_discrete(name="",labels=c("Co-trans 100% RiboProtect 0")) +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.5, label.y.npc = 0.3, size=5) +
scale_x_log10() + # not able to add the inset if i keep the log scales for either x or y
scale_y_log10() +
scale_color_manual(name="", labels=c("Co-trans 100% RiboProtect 0"), values = c("dc_1_r_0" = "black"))
figureS5
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS5, "../figures/figureS5.rds")
Fig S6: relative CV = CV of the protein synthesis rate/CV of the mRNA count
figureS6 <- allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B") %>% #"YCR024C-B" is an outlier whose relCV = 23
mutate(relCV = CVPS/CVMC) %>%
select(ORF, relCV, iniProb_log10, mRNAabundance_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
`colnames<-`(paste0("", c("ORF", "Relative_CV", "iniProb_log10", "mRNALevel_log10", "DecRate_log10", "CAI", "geneLength_log10"))) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", -c(ORF, Relative_CV)) %>%
ggplot(aes(x = featureVals, y = Relative_CV)) +
geom_point(size = 0.5) +
facet_wrap(~feature, scales = "free", nrow = 1, strip.position = "bottom") +
theme_bw() +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.15, label.y.npc = 0.8, size = 3) +
labs(x = "",
y = "Relative CV") +
scale_y_log10() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside") #to put the strip labels below x-axis
figureS6
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS6, "../figures/figureS6.rds")
Fig. S7:
figureS7 <- allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
ggplot(aes(x = featureVals, y = geneLength_codon)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Gene length (codon)",
title = "dc_1_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
figureS7
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS7, "../figures/figureS7.rds")
###################################################
allSimInputOutput %>%
filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A",ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
ggplot(aes(x = featureVals, y = geneLength_codon)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Gene length (codon)",
title = "dc_1_r_1") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

tmp <- allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A",ORF != "YGR169C-A", ORF != "YLR106C",ORF != "YCR024C-B") %>%
mutate(RDR = MMDR/mRNADecRateNeymotin_sec) %>%
select(RMTE, geneLength_codon, RDR)
summary(lm(RMTE~geneLength_codon+RDR, tmp))
Call:
lm(formula = RMTE ~ geneLength_codon + RDR, data = tmp)
Residuals:
Min 1Q Median 3Q Max
-0.080870 -0.005794 0.000774 0.008152 0.075226
Coefficients:
Estimate Std. Error t value Pr(>|t|)
(Intercept) 4.320e-01 9.835e-03 43.92 <2e-16 ***
geneLength_codon -2.947e-05 1.010e-06 -29.18 <2e-16 ***
RDR 6.010e-01 9.869e-03 60.90 <2e-16 ***
---
Signif. codes: 0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1
Residual standard error: 0.01439 on 4801 degrees of freedom
Multiple R-squared: 0.8319, Adjusted R-squared: 0.8319
F-statistic: 1.188e+04 on 2 and 4801 DF, p-value: < 2.2e-16
# MMDP = mRNAs marked for degradation proportion among mean total mRNA
# MTT = mean translation time
allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0) %>%
ggplot(aes(x = MTT, y = MMDP)) +
geom_point(size = 0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x = "Mean translation time",
y = "Proportion of mRNA marked for decay",
title = "") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size = 3) +
theme_bw()
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
ggplot(aes(x = featureVals, y = geneLength_codon)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Gene length (codon)",
title = "dc_0.2_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.2_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
ggplot(aes(x = featureVals, y = geneLength_codon)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Gene length (codon)",
title = "dc_0.2_r_1") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 1 rows containing non-finite values (stat_smooth).
Warning: Removed 1 rows containing non-finite values (stat_cor).

Fig. S8
figureS8 <- allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_1_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
figureS8
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS8, "../figures/figureS8.rds")
#############################################
allSimInputOutput %>%
filter(paraCombo == "dc_0.8_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0.8_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.6_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0.6_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.4_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1,strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0.4_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0.2_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color="black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 4804 rows containing non-finite values (stat_smooth).
Warning: Removed 4804 rows containing non-finite values (stat_cor).

allSimInputOutput %>%
filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_1_r_1") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text=element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

allSimInputOutput %>%
filter(paraCombo == "dc_0.2_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
`colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
ggplot(aes(x = featureVals, y = RelMeanTE)) +
geom_point(size = 0.1) +
facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
scale_x_log10() +
scale_y_log10() +
labs(x = "",
y = "Relative mean TE",
title = "dc_0.2_r_1") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 1 rows containing non-finite values (stat_smooth).
Warning: Removed 1 rows containing non-finite values (stat_cor).

allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MMDP, RMMDR) %>%
ggplot(aes(x = MMDP, y = RMMDR)) +
geom_point(size = 0.1) +
labs(x = "MMDP",
y = "Relative decay rates",
title = "dc_1_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

# MMDP = mRNAs marked for degradation proportion
allSimInputOutput %>%
filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
select(MMDP, RMMDR) %>%
ggplot(aes(x = MMDP, y = RMMDR)) +
geom_point(size = 0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x = "MMDP",
y = "Relative decay rates",
title = "dc_0.2_r_0") +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) +
theme_bw() +
theme(text = element_text(size = 13),
axis.text.x = element_text(size = rel(0.8)),
strip.text = element_text(color = "black"), # can't use element_blank() here because it gives error when p1+p2
strip.background = element_blank(),
strip.placement = "outside")
`geom_smooth()` using formula 'y ~ x'

Fig. S9
figureS9 <- allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", dc != 0) %>%
#select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
ggplot(aes(x = MMDP, y = RMTE)) +
geom_point(size = 0.1) +
facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "Co-trns 20%"), r = c("0" = "Ribo prot indx = 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Proportions of mRNAs undergoing CMD for all genes',
y = 'Relative mean translation efficiencies') +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
scale_x_log10() +
scale_y_log10()
figureS9
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 1 rows containing non-finite values (stat_smooth).
Warning: Removed 1 rows containing non-finite values (stat_cor).

write_rds(figureS9, "../figures/figureS9.rds")
##############################################################
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", , r==0|r==1, dc==0.2|dc==1) %>%
#select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
ggplot(aes(x = MMDP, y = RMTE)) +
geom_point(size = 0.1) +
facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "Co-trns 20%"), r = c("0" = "Ribo prot indx = 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Proportions of mRNAs undergoing CMD for all genes',
y = 'Relative mean translation efficiencies') +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
scale_x_log10() +
scale_y_log10()
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
Warning: Transformation introduced infinite values in continuous x-axis
`geom_smooth()` using formula 'y ~ x'
Warning: Removed 1 rows containing non-finite values (stat_smooth).
Warning: Removed 1 rows containing non-finite values (stat_cor).

Fig. S10
figureS10 <- allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
#select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
ggplot(aes(x = RMMDR, y = RMTE)) +
geom_point(size = 0.1) +
facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx = 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Relative mRNA decay rates',
y = 'Relative mean translation efficiencies') +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
scale_x_log10() +
scale_y_log10()
figureS10
`geom_smooth()` using formula 'y ~ x'

write_rds(figureS10, "../figures/figureS10.rds")
#########################################################
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", r==0|r==1, dc==0|dc==1) %>%
#select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
ggplot(aes(x = RMMDR, y = RMTE)) +
geom_point(size = 0.1) +
facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx = 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
theme_bw() +
theme(text = element_text(size = 13),
legend.position = "none",
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank()
) +
labs(x = 'Relative mRNA decay rates',
y = 'Relative mean translation efficiencies') +
geom_smooth(method = "lm") +
stat_cor(aes(label = paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
scale_x_log10() +
scale_y_log10()
`geom_smooth()` using formula 'y ~ x'

was Fig. S9, maybe should not use it coz the vline calculated from its input decay rate may not be accurate.
lifetimeDistri<- function(genevec){
dfplot <- cbind(dc.r.df[c(2:5, 22:25), ], data.frame(matrix(NA, ncol = 5000, nrow = 8*3))) %>%
mutate(ORF = c(rep(genevec[1], 8), rep(genevec[2], 8), rep(genevec[3], 8))) %>%
relocate(ORF)
for(i in 1:8){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[1], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
for(i in 9:16){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[2], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
for(i in 17:24){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[3], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
dfplot %>%
pivot_longer(names_to = "varyingParaCombo", values_to = "lifeTimes", cols = 6:5005) %>%
ggplot(aes(lifeTimes, fill = dc)) +
geom_density(alpha = 0.5, color = NA) +
facet_grid(factor(ORF, levels = genevec)~r,
labeller = labeller(r = c("0" = "Ribo prot index 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"))) +
scale_x_log10(labels = scales::comma_format(accuracy = 1L)) +
scale_fill_discrete(name = "CMD level",
labels = c("0" = "0", "0.2" = "20%", "0.6" = "60%", "1" = "100%")) +
theme_bw() +
labs(x = paste0("mRNA life time distribution (log10)")) +
theme(
legend.position = "top",
legend.justification = "left",
text = element_text(size = 13),
axis.text.x = element_text(size = 8)) +
geom_vline(data = filter(dfplot, ORF == genevec[1]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[1])]), linetype = "dashed", color = "dark grey") + #1049.856 =1/simInputFeatures$mRNADecRateNeymotin_sec[1] # 1049.856 is the input lifetime for YAL001C
geom_vline(data = filter(dfplot, ORF == genevec[2]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[2])]), linetype = "dashed", color = "dark grey") +
geom_vline(data = filter(dfplot, ORF == genevec[3]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[3])]), linetype = "dashed", color = "dark grey")
# the above lines are the average life time calculated from input decay rates
}
lifetimeDistri(c("YAL001C", "YKR075C", "YBR011C"))

lifetimeDistri(c("YLR106C", "YKR054C", "YHR099W")) # longest genes
Warning: Removed 6188 rows containing non-finite values (stat_density).

lifetimeDistri(c("YAR002C-A", "YBL050W", "YBR003W"))

allSimInputOutput %>%
filter(paraCombo == "dc_0_r_0", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>% #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
`colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
geom_point(size=0.5) +
facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
theme_bw() +
scale_y_log10() +
theme(text = element_text(size = 13),
legend.position = "none",
strip.text = element_text(color="black", size=rel(1.2)), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank(),
strip.background = element_blank(),
strip.placement = "outside" #to put the strip labels below x-axis
) +
labs(x = "",
y = "Relative mean translation efficiency",
title = "dc_0_r_0") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))
allSimInputOutput %>%
filter(paraCombo == "dc_0_r_1", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>% #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
`colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
geom_point(size=0.5) +
facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
theme_bw() +
scale_y_log10() +
theme(text = element_text(size = 13),
legend.position = "none",
strip.text = element_text(color="black", size=rel(1.2)), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank(),
strip.background = element_blank(),
strip.placement = "outside" #to put the strip labels below x-axis
) +
labs(x = "",
y = "Relative mean translation efficiency",
title = "dc_0_r_1") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))
allSimInputOutput %>%
filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>% #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
`colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
geom_point(size=0.5) +
facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
theme_bw() +
scale_y_log10() +
theme(text = element_text(size = 13),
legend.position = "none",
strip.text = element_text(color="black", size=rel(1.2)), # can't use element_blank() here because it gives error when p1+p2
plot.margin = margin(r = 0, unit = "pt"),
panel.grid = element_blank(),
strip.background = element_blank(),
strip.placement = "outside" #to put the strip labels below x-axis
) +
labs(x = "",
y = "Relative mean translation efficiency",
title = "dc_1_r_1") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))
tmpdf <- data.frame(lifetime = log10(as.numeric(dfplot[1, 6:5005])))
which.max(density(tmpdf$lifetime)$y)
density(tmpdf$lifetime)$x[387]
ggplot(tmpdf, aes(lifetime)) + geom_density() + geom_vline(xintercept = density(tmpdf$lifetime)$x[387])
Fig. S
NOTES: Output decay rate = 1/mean lifetime https://en.wikipedia.org/wiki/Particle_decay
Total output decay rate = output decay rate * output mean mRNA count
Total input decay rate = input decay rate * mRNAabundance
Total synthesis rate = a scaled constant
(The above rates are all gene-specific)
Summary: changing total output decay rate is a result of changing co-translational decay and ribosome protection. In order to maintain the constant mRNA level, we have to scale the total synthesis rates to counter-effect the changing output decay rates.
When co-translational decay is higher than 0, there’s always a surplus of mRNAs marked for decay, that are not accounted when calculating total decay probabilities (They’re not accounted because they already have decay machinery bound to them, so cannot be accounted again into the mRNA pool that can still be degraded). Therefore the synthesis rates are scaled, in order to maintain a stable relative mRNA count (= mean output mRNA count/mRNAabundance) for it to be close to 1 (Supp Fig 1). The mean output mRNA count for each gene is a result of the balance between its scaled synthesis rate and total output decay rate. In other words, the total output decay rate directly respond to the scaled synthesis rate, rather than the input decay rate.
The scaled total synthesis rates are the smallest when co-translational decay = 100%, so that the total real-time mRNA count can be close to mRNAabundance even with the highest amount of mRNAs marked for decay. In contrast, the scaled total synthesis rates are the largest and equal to the total input decay rates when co-trans decay = 0% (Supp Fig 2a), because there is 0 mRNA marked for decay.
Hypothetically, the total output decay rates should equal to the total synthesis rates in order to maintain the real-time mRNA count to be largely the same at the beginning and the end of the simulation. If unequal, the real-time mRNA count should either go up or down as the simulation continues compared to the begining amount (i.e. mRNAabundance). However, our results show that the total output decay rates are slightly larger than the scaled synthesis rates across all the parameter combos (Supp Fig 2b. this is the part I don’t understand, is it coz the total output decay rates include considering mRNAsMarkedForDecay, but the total scaled synthesis rates doesn’t include mRNAsMarkedForDecay), and that’s somehow contributing to the mean real-time mRNA count being equal to mRNAabundance as shown in Supp Fig 1.
Because the output decay rates directly respond to total synthesis rates, they are influenced by the para combos in the same way that total synthesis rates are. That explains why Supp Fig 2c is similar to Supp Fig 2a in that the peaks skew to the right as co-translational decay ratio goes down. However in Supp Fig 2a, the ratio (scaled synthesis rates V.S. total input decay rates) skewed from less than 1 to 1; while in Supp Fig 2c, the ratio (total output decay rates V.S. total input decay rates) skewed from 1 to larger than 1. This would make sense if we can explain what’s going on in Supp Fig 2b.
Meanwhile, the output decay rates for short genes are much less affected by different co-translational decay proportions than long genes (Supp Fig 2d). This should be a reflection that the total synthesis rates for short genes are changing less with changing co-translational decay.
Supp Fig 2a: The scaled synthesis rates are the smallest when co-trans decay = 100%, while theythe largest and equal to the total input decay rates when co-trans decay = 0%
Supp Fig 2b: Total output mRNA decay rates are slightly larger than scaled mRNA synthesis rates , but the ratio stays stable with changing parameters (I don’t understand why the decay rates have to be larger)
Supp Fig 2c: Output decay rates respond to scaled synthesis rates, therefore its ratio against input decay rates shows similar patter as scaled synthesis rates in Fig 2
Supp Fig 2d: Output decay rates for short genes are much less affected by different -translational decay than long genes
allSimInputOutput_trial <- read_feather("../../../exp0/externalData/exp11_outcomeAll.feather")
tmp <- allSimInputOutput_trial %>%
filter(combo != "mRNAconstant", w != 0.01, w != 0.05, w != 0.2) %>%
select(NMMC, combo, ORF, r, w) %>% # NMMC in trial = RMMC in exp0, "normalized" VS "relative"
mutate(dc=1-as.numeric(r)) %>%
select(-r) %>% #delete the original column named "r", in trial data the r means CMD levels, and w means ribosome protection index
dplyr::rename("r"="w", "paraCombo"="combo", "RMMCtrial"="NMMC") %>% # change the original col named "w" into "r", b/c "r" in exp0 means ribosome protection index
mutate(paraCombo=paste0("dc_", dc, "_r_", r)) %>%
select(-dc, -r)
sup1 <- (allSimInputOutput %>%
filter(paraCombo != "mRNAconstant") %>%
left_join(., tmp, by = c("paraCombo"="paraCombo", "ORF"="ORF"))) %>%
select("paraCombo", "RMMC", "RMMCtrial", "dc", "r") %>%
dplyr::rename("AfterScaling"="RMMC", "BeforeScaling"="RMMCtrial") %>%
pivot_longer(names_to = "key", values_to = "RMMCvalue", cols = 2:3) %>%
ggplot(aes(x=RMMCvalue, color=key)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(title = "Sup Fig 1: mRNA counts when varying are laregely equal to when they are constant \nafter scaling the mRNA synthesis rates",
x="Relative mean mRNA count") +
scale_y_continuous() +
geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
theme_bw() +
theme(legend.title = element_blank(),
legend.position = "bottom",
strip.text.x = element_text(size=10),
strip.text.y = element_text(size=10)) # make the gridline color darker
############################################ plotting the (total syn rate after scaling)/(input decay rate*mRNAabundance) for all genes for all rw combos
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839))
for (i in 1:(nrow(dc.r.df)-1))
{
inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
outdf[, i] <- inf[, 3]/(inf[, 4]*inf[, 2])
}
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
sup2a <- outdf %>%
pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
left_join(., dc.r.df, by = "paraCombo") %>%
filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
ggplot(aes(x=value)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
labs(title = "",
x="Scaled synthesis rates/Total input decay rates") +
theme_bw() +
theme(strip.text.x = element_text(size=9),
strip.text.y = element_blank()) +
scale_x_continuous(breaks = c(0.9, 1, 1.1, 1.3, 1.5))
############################################## plotting the (output decay rate)/(syn rate after scaling) for all genes for all dc/r paraCombos
mmdrAllgeneAlldcr <- read_feather("../calculatedMetrics/mmdrAllgeneAlldcr.feather")[, 2:nrow(dc.r.df)]
mmcAllgeneAlldcr<- read_feather("../calculatedMetrics/mmcAllgeneAlldcr.feather")[, 2:nrow(dc.r.df)]
totdr <- mmdrAllgeneAlldcr*mmcAllgeneAlldcr
totsynr <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839))
for (i in 1:(nrow(dc.r.df)-1))
{
inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
totsynr[, i] <- inf[, 3]
}
ratio.dr.synr <- totdr/totsynr
colnames(ratio.dr.synr) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
ratio.dr.synr <- ratio.dr.synr[-1278, ] # gene with the HL-min=490 min, the data point skews the scale
sup2b <- ratio.dr.synr %>%
pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
left_join(., dc.r.df, by = "paraCombo") %>%
filter(paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
filter(!is.na(value)) %>%
ggplot(aes(x=value)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(title = "",
x="Total output decay rates/Scaled synthesis rates") +
geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
theme_bw() +
theme(strip.text.x = element_text(size=9),
strip.text.y = element_text(size=9),
axis.title.y = element_blank())
############################################ plotting the (output decay rate*real time mRNA)/(input decay rate*mRNAabundance)for all genes for all rw combos
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates
for (i in 1:(nrow(dc.r.df)-1)) # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
outdf[, i] <- (inf[, 4]*inf[, 2])
}
outdf <- totdr/outdf
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
sup2c <- outdf[-1278, ] %>% # gene with the HL-min=490 min, the data point skews the scales
pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
left_join(., dc.r.df, by = "paraCombo") %>%
filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
ggplot(aes(x=value)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
labs(title = "",
x="Total output decay rates/Total input decay rates") +
theme_bw() +
theme(#strip.text.x = element_text(size=8),
strip.text.y = element_blank(),
strip.text.x = element_blank()) # hide the grid title
############################################
# sl = short or long
outdf$sl <- rep(NA,4839)
outdf$sl[which(simInputFeatures$geneLength_codon>512)] <- "Long"
outdf$sl[which(simInputFeatures$geneLength_codon<=512)] <- "Short"
sup2d <- outdf[-1278, ] %>% # took the gene with the HL-min=490 min, the data point skews the scales
pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
left_join(., dc.r.df, by = "paraCombo") %>%
filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
ggplot(aes(x=value, color=sl, group=sl)) +
geom_density() +
facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
labs(title = "",
x="Total output decay rates/Total input decay rates") +
geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
theme_bw() +
theme(
strip.text.y = element_text(size=9),
strip.text.x = element_blank(),
legend.position = c(0.9, 0.95),
axis.title.y = element_blank(),
legend.background=element_blank(), # change the legend background to transparent
legend.key.size = unit(0.5, "line")) +
scale_color_discrete(name = "", labels = )
############################################
sup1
sup2 <- (sup2a|sup2b)/(sup2c|sup2d)
sup2 + plot_annotation(
title = 'Supp Fig 2.',
# subtitle = 'Supp Fig 2.',
# caption = 'Hello', # this one appears at the bottom
tag_levels = 'a'
)
####################################
tot.in.dr <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates
for (i in 1:(nrow(dc.r.df)-1)) # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
inf <- read.table(paste0(basefolder, expID, "/input/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec"))
tot.in.dr[, i] <- (inf[, 4]*inf[, 2])
}
mmdrAllgeneAlldcr <- read_feather(paste0(basefolder, expID, "/analyses/featherFiles/mmdrAllgeneAlldcr.feather"))[, 2:nrow(dc.r.df)]
mmcAllgeneAlldcr<- read_feather(paste0(basefolder, expID, "/analyses/featherFiles/mmcAllgeneAlldcr.feather"))[, 2:nrow(dc.r.df)]
tot.out.dr <- mmdrAllgeneAlldcr*mmcAllgeneAlldcr
outdf <- tot.out.dr/tot.in.dr
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
outdf[-1278, ] %>% # gene with the HL-min=490 min, the data point skews the scales
pivot_longer(names_to = "paraCombo", values_to = "outInDrRatio", cols = 1:(nrow(dc.r.df)-1)) %>%
left_join(., dc.r.df, by = "paraCombo") %>%
filter(outInDrRatio != 0) %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
ggplot(aes(x=dc_fct, y=outInDrRatio, fill=r)) +
geom_boxplot(outlier.size = 0.1) +
geom_hline(aes(yintercept=median(as.numeric(unlist(outdf %>%select(dc_1_r_0)))[-1278], na.rm = TRUE)),
color="red", linetype="dashed") +
theme_bw() +
labs(x="CMD level",
y="Ratio between total output/input decay rates") +
scale_x_discrete(labels=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0")) +
scale_fill_discrete(name = "Ribosome\nprot index") +
theme(
text = element_text(size = 13),
legend.position = "none"
)
##############
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates
for (i in 1:(nrow(dc.r.df)-1)) # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
inf <- read.table(paste0(basefolder, expID, "/input/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec"))
outdf[, i] <- (inf[, 4]*inf[, 2])
}
outdf <- totdr/outdf
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
outdf %>%
mutate(mRNAabundance=simInputFeatures$mRNAabundance, mRNADecRateNeymotin_sec=simInputFeatures$mRNADecRateNeymotin_sec, ORF=simInputFeatures$ORF) %>%
pivot_longer(names_to = "paraCombo", values_to = "ratioVal", cols = !c(mRNAabundance, mRNADecRateNeymotin_sec, ORF)) %>%
filter(paraCombo == "dc_0_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A") %>%
ggplot(aes(x=mRNAabundance, y=ratioVal)) +
geom_point() +
theme_bw() +
scale_x_log10()
Fig. S
l %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
mutate(relativeFano = RMVPS/RMPSR) %>%
ggplot(aes(x=RMPSR, y=relativeFano)) +
geom_point(size=0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x= "Realtive mean protein synthesis rate",
y = "Relative fano factor in protein synthesis rate",
title = "") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) +
theme_bw()
allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
ggplot(aes(x=MRD, y=RMVTE)) +
geom_point(size=0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x= "Mean ribosome density",
y = "Relative mean of variance in translation efficiency",
title = "") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) +
theme_bw()
allSimInputOutput %>%
filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
ggplot(aes(x=MMDP, y=mRNADecRateNeymotin_sec)) +
geom_point(size=0.1) +
scale_x_log10() +
scale_y_log10() +
labs(x= "Mean ribosome density",
y = "Relative mean of variance in translation efficiency",
title = "") +
geom_smooth(method="lm") +
stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) +
theme_bw()
Figure S.
# calculating the mean number of free ribos (averaged over simuTime and techReps) for all dc.r.paraCombos
# RMFR = relative mean free ribo
mfr <- c()
for(i in 1:nrow(dc.r.df)) # loop through the dc/r parameter space to calculate the mean free ribo
{
# free_ribo averaged by simuTime and techReps
mfr <- c(mfr, mean(h5read(simOutputH5, paste("free_ribo_tRNA_perMin", dc.r.df$paraCombo[i], "ribo", sep="/")), na.rm = TRUE))
# set na.rm=T because in rep 66 again there's an NA at the last minute, which won't affect the overall mean
}
rmfr <- mfr/mfr[1]
rmfr_df <- data.frame(RMFR = rmfr,
MFR = mfr,
para = dc.r.df$para)
# rmfr_df can be found in exp0_prepPlots.Rmd
rmfr_df %>%
left_join(., dc.r.df, by ="para") %>%
filter(paraCombo != "mRNAconstant") %>%
select(RMFR, dc, r) %>%
spread(dc, RMFR) %>%
select(-r) %>%
colMeans() %>%
tibble() %>%
mutate(dc=as.character(seq(0, 1, by=0.2))) %>%
`colnames<-`(c("RMFRmeanByCoTrans", "dc")) %>%
mutate(cotrans = paste0(as.numeric(dc)*100, "%")) %>%
ggplot(aes(x=cotrans, y=RMFRmeanByCoTrans)) +
geom_point() +
theme_bw() +
labs ( title = "",
x ="Co-translational decay proportion",
y = "Mean free ribosomes (relative to mRNA constant)") +
theme(text = element_text(size = 13),
panel.grid = element_blank()) +
scale_x_discrete(limits = c("100%", "80%", "60%", "40%", "20%", "0%"))
make_heatmap <- function(orderVar, outputVar, legendName, titleY)
{
colorvec <- quantile(allSimInputOutput[[outputVar]])
tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", orderVar)]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant") %>%
left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
ggplot(aes_string(x = "r",
y = "factor(newid_dc1r0)",
fill = outputVar)) +
geom_raster() +
theme_bw() +
scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"), # blue white red
values = scales::rescale(colorvec), name=legendName) +
facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0"))) +
labs ( x = "Ribosome protection index r",
y = titleY,
title = "") +
theme(text = element_text(size = 18),
axis.text.y = element_blank(),
axis.ticks.y = element_blank(),
panel.border = element_blank(), # remove the grid lines in facet_grid
panel.spacing=unit(0, "lines")) + # reset the spacing between facets
guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
}
# 1st var= the variable column the sorting is based on
# 2nd var= the variable column presented in the heatmap
# 3rd var= the legend text
# 4th var= y-axis title
make_heatmap("RMTE", "RMTE", "Relative\nmean translation\nefficiency", "Genes ranked by the first column")
make_heatmap("RMVTE", "RMVTE", "Relative mean\nof the variance\nin translation\nefficiency", "Genes ranked by the first column")
########################################################## add a plot for mRNAs marked for decay
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$MMDP)
tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839
allSimInputOutput %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", dc != 0) %>%
left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
ggplot(aes(x = r,
y = factor(newid_dc1r0),
#y = as.character(newid_geneLength_codon), # genes are sorted by geneLength_codon within each group
fill = MMDP)) +
geom_raster() +
theme_bw() +
scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"), # blue white red
values = scales::rescale(colorvec), name="mRNAs marked\nfor decay ratio") +
facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0%"))) +
labs ( x = "Ribosome protection index w",
y = "Genes ranked by the first column in translation efficiency plot",
title = "") +
theme(text = element_text(size = 18),
plot.title = element_text(size=rel(1.5)),
axis.text.y = element_blank(),
axis.ticks.y = element_blank(),
panel.border = element_blank(), # remove the grid lines in facet_grid
panel.spacing=unit(0, "lines")) + # reset the spacing between facets
guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
########################################################## add another plot for mRNAs marked for decay
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$MMDP)
tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMVTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839
allSimInputOutput %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", dc != 0) %>%
left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
ggplot(aes(x = r,
y = factor(newid_dc1r0),
fill = MMDP)) +
geom_raster() +
theme_bw() +
scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"), # blue white red
values = scales::rescale(colorvec), name="mRNAs marked\nfor decay ratio") +
facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0%"))) +
labs ( x = "Ribosome protection index w",
y = "Genes ranked by the first column in translation efficiency plot",
title = "") +
theme(text = element_text(size = 18),
plot.title = element_text(size=rel(1.5)),
axis.text.y = element_blank(),
axis.ticks.y = element_blank(),
panel.border = element_blank(), # remove the grid lines in facet_grid
panel.spacing=unit(0, "lines")) + # reset the spacing between facets
guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
# 1st var= the variable column the sorting is based on
# 2nd var= the variable column presented in the heatmap
# 3rd var= the legend text
# 4th var= y-axis title
make_heatmap("RMPSR", "RMPSR", "Relative\nmean protein\nsyn rate", "Genes ranked by the first column")
make_heatmap("RMVPS", "RMVPS", "Relative\nmean of variance in\nprotein syn rate", "Genes ranked by the first column")
make_heatmap_tmp <- function(orderVar, outputVar, legendName, titleY)
{
colorvec <- quantile(allSimInputOutput[[outputVar]])
tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", orderVar)]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", RMVTBR != Inf) %>%
left_join(.,tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
ggplot(aes_string(x = "r",
y = "factor(newid_dc1r0)",
fill = outputVar)) +
geom_raster() +
theme_bw() +
scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"), # blue white red
values = scales::rescale(colorvec), name=legendName) +
facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0"))) +
labs ( x = "Ribosome protection index r",
y = titleY,
title = "") +
theme(text = element_text(size = 18),
axis.text.y = element_blank(),
axis.ticks.y = element_blank(),
panel.border = element_blank(), # remove the grid lines in facet_grid
panel.spacing=unit(0, "lines")) + # reset the spacing between facets
guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
}
make_heatmap_tmp("RMTE", "RMVTBR", "Relative\nvariance in total\nbound ribosomes", "Genes ranked by the first column in relative TE")
make_heatmap("MML", "MML", "Mean of mRNA\nlife-times", "Genes ranked by the first column")
###############################################################
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$RMRD)
tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839
allSimInputOutput %>%
filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A") %>%
left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
ggplot(aes(x = r,
y = factor(newid_dc1r0),
fill = RMRD)) +
geom_raster() +
theme_bw() +
scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"), # blue white red
values = scales::rescale(colorvec), name="Relative mean\nribo density") +
facet_wrap(~dc, nrow=1, labeller=labeller(dc=c("1"="Co-trans 100%", "0.8"="0.8", "0.6"="0.6", "0.4"="0.4", "0.2"="0.2", "0"="0"))) +
labs ( x = "Ribosome protection index",
y = "Genes ranked by the first column for translation efficiency",
title = "") +
theme(text = element_text(size = 18),
plot.title = element_text(size=rel(1.5)),
axis.text.y = element_blank(),
axis.ticks.y = element_blank(),
panel.border = element_blank(), # remove the grid lines in facet_grid
panel.spacing=unit(0, "lines")) + # reset the spacing between facets
guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
---
title: "Figures for manuscript"
output:
  pdf_document: default
  html_notebook: default
---

Load libraries and public variables
```{r, include=FALSE} 
# This chunk will be evaluated but the output is suppressed
rmarkdown::render("../../publicVariables/createPublicVariables.Rmd")
```

```{r}
# File that contains simulation output data in a HDF5 directory structure specified in "/publicVariables/createPublicVariables.Rmd"
simOutputH5 <- paste0("../../dataProcessing/simOutputH5Data/", experimentID, "_output.h5")

# A comprehensive table that contains all simulation input and calculated output metrics
allSimInputOutput <- read_feather("../allSimInputOutput.feather")

# This folder contains raw output files from the simulations. This is needed for calculate_para_sp_mcpsr()
rawSimOutFolder <- "/team/batch_SMOTNT/experiment1_output"

# Where figures are stored
figureBaseFolder <- "../figures/"
```

Validation: compare the protein synthesis rates with Weinberg 2016
```{r fig.height=4, fig.width=6}
weinbergData <- read_tsv("../externalData/weinberg_synthesis.txt")

validationPlot <- allSimInputOutput %>% 
  filter(paraCombo == "mRNAconstant") %>% 
  select(ORF, paraCombo, MPSR, dc, r) %>%
  left_join(weinbergData[, c("ORF", "S")], by = "ORF") %>%
  mutate(S_perMin=S*60,
         newcombo=factor(paraCombo, levels=dc.r.df$paraCombo[2:25])) %>%
  ggplot(aes(x=MPSR, y=S_perMin)) +
    geom_abline(linetype="dashed") +
    geom_point() +
    geom_smooth(method="lm") +
    stat_cor(aes(label=paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.7, size=10) +
    scale_x_log10() +
    scale_y_log10() +
    theme_bw() +
    labs(x="Mean protein synthesis rates for mRNA constant",
         y="Protein synthesis rate estimates by Weinberg et al 2016")

validationPlot

write_rds(validationPlot, "../figures/validationPlot.rds")


tmp <- allSimInputOutput %>% 
    filter(paraCombo == "mRNAconstant") %>% 
    select(ORF, paraCombo, MPSR) %>%
    left_join(weinbergData[, c("ORF", "S")], by = "ORF") %>%
    mutate(S_perMin=S*60) 

# quick try of piping the t test didn't work..
t.test(tmp$S_perMin, tmp$MPSR, paired = TRUE)
```

```{r fig.height=4, fig.width=6}
figS0_a <- allSimInputOutput %>%
    filter(paraCombo=="mRNAconstant"|paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    ggplot(aes(x=MPSR, y=PMPSR, color = paraCombo)) +
    geom_point(size = 0.5) +
    geom_abline(linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'Mean of protein synthesis rate'~(min^-1),
             y = 'Predicted mean of protein synthesis rate'~(min^-1)) +
        scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() +
        scale_y_log10()

figS0_a
write_rds(figS0_a,"../figures/figS0_a.rds")
######################################################
figS0_b <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, MVPS, PMPSR, mRNASynRateTotal_sec) %>%
    mutate(mRNASynRateTotal_min = mRNASynRateTotal_sec*60,
           additiveVar = PMPSR + mRNASynRateTotal_min,
           multiplicativeVar = PMPSR * mRNASynRateTotal_min + PMPSR^2*mRNASynRateTotal_min + PMPSR*mRNASynRateTotal_min^2) %>% 
    select(ORF, MVPS, additiveVar, multiplicativeVar) %>% 
    pivot_longer(names_to = "predictedVar", values_to = "predictedVarValue", cols = -c(ORF,MVPS)) %>% 
    ggplot(aes(x=MVPS, y=predictedVarValue, color = predictedVar)) +
    geom_point(size = 0.5) +
    geom_abline(linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'Variance of protein synthesis rate'~(min^-2),
             y = 'Predicted variance of protein synthesis rate'~(min^-2)) +
        scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() +
        scale_y_log10()

figS0_b
write_rds(figS0_b, "../figures/figS0_b.rds")
######################################################
figS0_c <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, MPSR, RMPSR) %>% 
    ggplot(aes(x = MPSR, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'mean prot syn rate for mRNAvarying'~(min^-1),
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() 

figS0_c
write_rds(figS0_c, "../figures/figS0_c.rds")
######################################################
figS0_d <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, MPSR, RMPSR) %>%
    arrange(MPSR) %>% 
    # mutate(binNames = c(unlist(lapply(1:19, function(x){rep(x,254)})), rep(20,12))) %>%  # bin all 4838 genes into 20 bins, each contains same number of genes ordered by their MPSR
    # ggplot(aes(x = factor(binNames, levels = 1:20), y = RMPSR)) +
    mutate(binNames = c(unlist(lapply(1:9, function(x){rep(x,537)})), rep(10,5))) %>%  # bin all 4838 genes into 10 bins, each contains same number of genes ordered by their MPSR
    ggplot(aes(x = factor(binNames, levels = 1:10), y = RMPSR)) +
    geom_boxplot() +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'mean prot syn rate for mRNAvarying'~(min^-1),
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) 

figS0_d
write_rds(figS0_d, "../figures/figS0_d.rds")
######################################################
figS0_e <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, MPSR, RMPSR) %>%
    arrange(MPSR) %>% 
    # mutate(binNames = c(unlist(lapply(1:19, function(x){rep(x,254)})), rep(20,12))) %>%  # bin all 4838 genes into 20 bins, each contains same number of genes ordered by their MPSR
    # ggplot(aes(x = factor(binNames, levels = 1:20), y = RMPSR)) +
    mutate(binNames = c(unlist(lapply(1:9, function(x){rep(x,537)})), rep(10,5))) %>%  # bin all 4838 genes into 10 bins, each contains same number of genes ordered by their MPSR
    group_by(binNames) %>% 
    mutate(test = RMPSR>1) %>% 
    #mutate(freqRMPSRabove1 = sum(test)/n()) %>% 
    summarize(freqRMPSRabove1 = sum(test)/n()) %>% 
    ggplot(aes(x = factor(binNames, levels = 1:10), y = freqRMPSRabove1)) +
    geom_bar(stat='identity') +
    #geom_abline(linetype="dashed") +
    #geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'bins of genes',
             y = 'freq of rel. mean prot syn rate above 1 in each bin')

figS0_e
write_rds(figS0_e, "../figures/figS0_e.rds")
######################################################
figS0_f <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, mRNAabundance, RMPSR) %>% 
    ggplot(aes(x = mRNAabundance, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'mRNA abundances',
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() 

figS0_f
write_rds(figS0_f, "../figures/figS0_f.rds")
######################################################
figS0_g <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, CAI, RMPSR) %>% 
    ggplot(aes(x = CAI, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'CAI',
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) 

figS0_g
write_rds(figS0_g, "../figures/figS0_g.rds")
######################################################
figS0_h <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, iniProb, RMPSR) %>% 
    ggplot(aes(x = iniProb, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'translation initiation probability',
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() 

figS0_h
write_rds(figS0_h, "../figures/figS0_h.rds")
######################################################
figS0_i <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    #mutate(intCtrlOrNot = ifelse(mRNADecRateNeymotin_sec==0,"intCtrl","nonCtrl")) %>% 
    #select(paraCombo, ORF, geneLength_codon, RMPSR, intCtrlOrNot) %>% 
    select(paraCombo, ORF, geneLength_codon, RMPSR) %>% 
    #ggplot(aes(x = geneLength_codon, y = RMPSR, color = intCtrlOrNot)) +
    ggplot(aes(x = geneLength_codon, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'gene length (codon)',
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() 

figS0_i
write_rds(figS0_i, "../figures/figS0_i.rds")
######################################################
figS0_j <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A") %>%
    select(paraCombo, ORF, mRNADecRateNeymotin_min, RMPSR) %>% 
    ggplot(aes(x = mRNADecRateNeymotin_min, y = RMPSR)) +
    geom_point(size = 0.5) +
    #geom_abline(linetype="dashed") +
    geom_hline(yintercept = 1, linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "top",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x = 'mRNA decay rates from Neymotin data (min)',
             y = 'relative mean prot syn rate for mRNAvarying'~(min^-1)) +
        #scale_color_manual(name="", labels=c("mRNAconstant"="mRNAconstant", "dc_1_r_0"="mRNAvarying"), values = c("#1F78B4", "#FF7F00")) +
        geom_smooth() +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size=5) +
        scale_x_log10() 

figS0_j
write_rds(figS0_j, "../figures/figS0_j.rds")

######################################################
figS0_k <- allSimInputOutput %>%
    filter(paraCombo!= "mRNAconstant") %>% 
    select(dc, r, RMFR) %>% 
    unique() %>% 
    ggplot(aes(x = dc, y = RMFR, color = factor(r))) +
    geom_point() +
    geom_line() +
    # theme_bw() +
    # theme(text = element_text(size = 13),
    #           legend.position = "top",
    #           strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
    #           plot.margin = margin(r = 0, unit = "pt"),
    #           panel.grid = element_blank()
    #   ) +
        labs(x = 'CMD levels',
             y = 'Relative mean free ribosomes') +
  scale_color_discrete(name = "Ribo protection index")

figS0_k
write_rds(figS0_k, "../figures/figS0_k.rds")


######################################################
figS0_l <- allSimInputOutput %>%
  filter(paraCombo=="dc_0_r_1", ORF!="YER053C-A") %>% #remove the gene with the 450min HL
  # filter(paraCombo=="dc_0_r_1", ORF!="YER053C-A", mRNADecRateNeymotin_sec==0) %>% 
  # select("ORF", "RMPSR", "RMFR") %>% 
  mutate(intCtrlOrNot = ifelse(mRNADecRateNeymotin_sec==0,"intCtrl","nonCtrl")) %>% 
  select("ORF", "RMPSR", "intCtrlOrNot") %>% 
  #select("ORF", "RMPSR") %>% 
  ggplot() +
  geom_density(aes(x=RMPSR, color = intCtrlOrNot)) +
  theme_bw() +
  theme(text = element_text(size = 13),
        legend.position = c(0.6, 0.6),
        legend.background = element_blank(),
        axis.ticks.y = element_blank(),
        plot.margin = margin(r = 0, unit = "pt"),
        panel.grid = element_blank()) +
    labs(x = "Rel. mean protein synthesis rate") +
    #scale_color_manual(values = c("RMVPS"="black")) +  
    scale_color_manual(values = c("intCtrl"="blue", "nonCtrl"="black")) +  
    scale_x_log10() +
    geom_vline(xintercept = 1, linetype = "dashed") 

figS0_l
write_rds(figS0_l, "../figures/figS0_l.rds")
```



Fig S1
```{r fig.height = 6, fig.width=10}
trial_mRNAcount <- read_feather("../../simulations/trialmRNAcountData/trial_mRNAcount.feather")
trial_mRNAcount

figureS1 <- allSimInputOutput %>%
    left_join(., trial_mRNAcount[,c("paraCombo","ORF","trialRMMC")], by = c("paraCombo"="paraCombo", "ORF"="ORF")) %>%
    filter(paraCombo != "mRNAconstant") %>%
    select(paraCombo, RMMC, trialRMMC, dc, r) %>%
    `colnames<-`(c("paraCombo", "AfterScaling", "BeforeScaling", "dc", "r")) %>%
    pivot_longer(names_to = "key", values_to = "RMMCvalue", cols = 2:3) %>%
    ggplot(aes(x=RMMCvalue, color=key)) +
        geom_density() +
        facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) + 
        labs(title = "Fig S1: mRNA counts when varying are laregely equal to when they are constant \nafter scaling the mRNA synthesis rates", 
             x="Relative mean mRNA count") +
        scale_y_continuous() +
        theme_bw() +
        theme(text=element_text(size=13), 
              legend.title = element_blank(), 
              legend.position = "bottom")

figureS1

write_rds(figureS1, "../figures/figureS1.rds")
#ggsave(paste0(figureBaseFolder, "figures1/s_fig_1.png"), dpi=100, height = 6, width = 8)

###########################################################
allSimInputOutput %>% 
  filter(paraCombo != "mRNAconstant") %>% 
  select(paraCombo, RMMC, dc, r) %>% 
  ggplot(aes(x = RMMC)) + 
      geom_density() +
      facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) + 
      labs(x="Relative mean mRNA count after scaling") +
      scale_y_continuous() +
      theme_bw() +
      theme(text=element_text(size=13), 
            legend.title = element_blank(), 
            legend.position = "none") +
      geom_vline(xintercept = 1, linetype = "dashed")


###########################################################
allSimInputOutput %>%
    filter(paraCombo != "mRNAconstant") %>%
    select(paraCombo, RMMC, dc, r, geneLength_codon) %>%
    mutate(sORl = ifelse(geneLength_codon >=512, "long", "short")) %>%
    ggplot(aes(x=RMMC, color=sORl)) +
        geom_density() +
        facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) + 
        labs(x="Relative mean mRNA count") +
        scale_y_continuous() +
        theme_bw() +
        theme(legend.title = element_blank(), 
              legend.position = "bottom", 
              strip.text.x = element_text(size=10), 
              strip.text.y = element_text(size=10))
###########################################################
allSimInputOutput %>%
    filter(paraCombo != "mRNAconstant") %>%
    select(paraCombo, RMMC, dc, r, mRNADecRateNeymotin_sec) %>%
    mutate(fORs = ifelse(mRNADecRateNeymotin_sec >=0.0009431628, "fast", "slow")) %>%
    ggplot(aes(x=RMMC, color=fORs)) +
        geom_density() +
        facet_grid(dc~r, labeller=labeller(dc=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="Co-trns 0%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) + 
        labs(x="Relative mean mRNA count") +
        scale_y_continuous() +
        theme_bw() +
        theme(legend.title = element_blank(), 
              legend.position = "bottom", 
              strip.text.x = element_text(size=10), 
              strip.text.y = element_text(size=10))


allSimInputOutput%>%
  filter(ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0, paraCombo!="mRNAconstant") %>%
  mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
  ggplot(aes(x=dc_fct, y=RMMC, fill=r)) +
  geom_boxplot(outlier.size = 0.1) +
  # geom_hline(aes(yintercept=median(as.numeric(unlist(allSimInputOutput%>%filter(ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0, paraCombo=="dc_1_r_0")%>%select(RMMDR))), na.rm = TRUE)), color="red", linetype="dashed") +
  theme_bw() +
  labs(x="CMD level",
       y="Relative mean mRNA count") +
  scale_x_discrete(labels=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0")) +
  scale_fill_discrete(name = "Ribosome\nprot index") +
  theme(
    text = element_text(size = 13),
    legend.position = "none"
  )
  

allSimInputOutput %>%
  group_by(paraCombo) %>%
  summarise(M = mean(RMMC)) %>%
  arrange(desc(M))

allSimInputOutput %>%
  group_by(dc) %>%
  summarise(M = mean(RMMC)) %>%
  arrange(desc(M))

```



Fig. was S3, now S2
```{r fig.height = 6, fig.width =  10}
figureS2 <- allSimInputOutput %>%
  filter(paraCombo != "mRNAconstant", ORF != "YER053C-A", mRNADecRateNeymotin_sec != 0) %>%
  ggplot(aes(x = MMC, y = MVMC)) +
  geom_point(size = 0.5) +
  geom_abline(linetype = "dashed") +
  facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx  =  0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
  theme_bw() +
  theme(text = element_text(size = 13),
            legend.position = "none",
            plot.margin = margin(r = 0, unit = "pt"),
            panel.grid = element_blank()
    ) +
      labs(x = 'Mean of mRNA count',
           y = 'Variance of mRNA count') +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.7, label.y.npc = 0.4, size = 5) +
      scale_x_log10() +
      scale_y_log10()

figureS2
write_rds(figureS2, "../figures/figureS2.rds")

```




was Fig S4, now S3: Sequence features correlate with the fano factor of protein synthesis rates for mRNA constant
```{r fig.height = 3, fig.width = 8}
plot_fun1 <- function(var1, var2){ allSimInputOutput%>%  #var1:"MeanProteinSynRate".. var2:"mRNAconstant", "dc_1_r_0"
  filter(paraCombo == var2, mRNADecRateNeymotin_sec != 0) %>%
  select(ORF, MPSR, MVPS, iniProb_log10, mRNAabundance_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
  mutate(fano_protSyn = MVPS/MPSR) %>%
  filter(fano_protSyn>0.3) %>%  # filter out the two outliers
  `colnames<-`(paste0("",c("ORF", "MeanProteinSynRate", "VarianceProteinSynRate", "iniProb_log10", "mRNALevel_log10", "DecRate_log10", "CAI", "geneLength_log10", "fano_protSynRate"))) %>%
  pivot_longer(names_to = "feature", values_to = "featureVals", !c(ORF,MeanProteinSynRate, VarianceProteinSynRate, fano_protSynRate)) %>%
  ggplot(aes_string(x = "featureVals", y = var1)) +
    geom_point(size = 0.5) +
    facet_wrap(~feature, scales = "free", nrow = 1, strip.position = "bottom") +
    theme_bw() +
    geom_smooth(method = "lm") +
    stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.4, label.y.npc = 0.13, size = 3) +
  labs(x = "",
       y = var1) +
    scale_y_log10() +
  theme(text = element_text(size = 13),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside"     #to put the strip labels below x-axis
)
}

figureS3 <- plot_fun1("fano_protSynRate", "mRNAconstant")

figureS3
write_rds(figureS3, "../figures/figureS3.rds")
```

Was Fig S5, now S4. 
```{r fig.height = 4, fig.width = 6}
# MMDP = mRNAs marked for degradation proportion among mean total mRNA
figureS4 <- allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0) %>%
    ggplot(aes(x = MMDP, y = RMPSR)) +
    geom_point(size = 0.1) +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "Proportion of mRNA marked for decay", 
        y = "Relative mean of protein synthesis rates", 
        title = "") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.1, label.y.npc = 0.3, size = 3) + 
    theme_bw() +
    theme(text=element_text(size = 13))

figureS4
write_rds(figureS4, "../figures/figureS4.rds")

```
Fig. S5
```{r fig.height = 4, fig.width = 6}
figureS5 <- allSimInputOutput %>%
    filter(paraCombo=="dc_1_r_0", ORF!="YER053C-A", mRNADecRateNeymotin_sec!=0) %>% 
    select("ORF", "CVPS", "CVMC", "paraCombo") %>% #remove the gene with the 450min HL
    ggplot(aes(x=CVMC, y=CVPS, colour=paraCombo)) +
    geom_point(size = 0.5) +
    geom_abline(linetype="dashed") +
    theme_bw() +
    theme(text = element_text(size = 13),
              legend.position = "none",
              strip.text = element_text(color="white"),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank()
      ) +
        labs(x ="CV for mRNA count per min",
             y = "CV for protein synthesis rate") +
        #scale_color_discrete(name="",labels=c("Co-trans 100% RiboProtect 0")) +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.5, label.y.npc = 0.3, size=5) +
        scale_x_log10() + # not able to add the inset if i keep the log scales for either x or y
        scale_y_log10() +
        scale_color_manual(name="", labels=c("Co-trans 100% RiboProtect 0"), values = c("dc_1_r_0" = "black"))

figureS5
write_rds(figureS5, "../figures/figureS5.rds")
```


Fig S6: relative CV = CV of the protein synthesis rate/CV of the mRNA count
```{r fig.height = 3, fig.width = 8}
figureS6 <- allSimInputOutput %>%
  filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B") %>%    #"YCR024C-B" is an outlier whose relCV = 23
  mutate(relCV = CVPS/CVMC) %>%
  select(ORF, relCV, iniProb_log10, mRNAabundance_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
    `colnames<-`(paste0("", c("ORF", "Relative_CV", "iniProb_log10", "mRNALevel_log10", "DecRate_log10", "CAI", "geneLength_log10"))) %>%
  pivot_longer(names_to = "feature", values_to = "featureVals", -c(ORF, Relative_CV)) %>%
  ggplot(aes(x = featureVals, y = Relative_CV)) +
    geom_point(size = 0.5) +
      facet_wrap(~feature, scales = "free", nrow = 1, strip.position = "bottom") +
      theme_bw() +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.15, label.y.npc = 0.8, size = 3) +
    labs(x = "",
         y = "Relative CV") +
      scale_y_log10() +
      theme(text = element_text(size = 13),
            strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
            strip.background = element_blank(),  
            strip.placement = "outside")     #to put the strip labels below x-axis

figureS6
write_rds(figureS6, "../figures/figureS6.rds")

```

Fig. S7: 
```{r fig.height = 4, fig.width = 7}
figureS7 <- allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
    ggplot(aes(x = featureVals, y = geneLength_codon)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Gene length (codon)",
        title = "dc_1_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
          strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
          strip.background = element_blank(),  
          strip.placement = "outside")

figureS7
write_rds(figureS7, "../figures/figureS7.rds")
###################################################

allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A",ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
    ggplot(aes(x = featureVals, y = geneLength_codon)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Gene length (codon)",
        title = "dc_1_r_1") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
          strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
          strip.background = element_blank(),  
          strip.placement = "outside")


tmp <- allSimInputOutput %>%
       filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A",ORF != "YGR169C-A", ORF != "YLR106C",ORF != "YCR024C-B") %>%
       mutate(RDR = MMDR/mRNADecRateNeymotin_sec) %>%
       select(RMTE, geneLength_codon, RDR) 
summary(lm(RMTE~geneLength_codon+RDR, tmp))

# MMDP = mRNAs marked for degradation proportion among mean total mRNA
# MTT = mean translation time
allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0) %>%
    ggplot(aes(x = MTT, y = MMDP)) +
    geom_point(size = 0.1) +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "Mean translation time",
        y = "Proportion of mRNA marked for decay",
        title = "") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size = 3) + 
    theme_bw() 


allSimInputOutput %>%
    filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
    ggplot(aes(x = featureVals, y = geneLength_codon)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Gene length (codon)",
        title = "dc_0.2_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
          strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
          strip.background = element_blank(),  
          strip.placement = "outside")


allSimInputOutput %>%
    filter(paraCombo == "dc_0.2_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !geneLength_codon) %>%
    ggplot(aes(x = featureVals, y = geneLength_codon)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Gene length (codon)",
        title = "dc_0.2_r_1") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
          strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
          strip.background = element_blank(),  
          strip.placement = "outside")
```



Fig. S8
```{r fig.height = 4, fig.width = 7}
figureS8 <- allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_1_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")

figureS8
write_rds(figureS8, "../figures/figureS8.rds")

#############################################

allSimInputOutput %>%
    filter(paraCombo == "dc_0.8_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0.8_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")

allSimInputOutput %>%
    filter(paraCombo == "dc_0.6_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0.6_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")

allSimInputOutput %>%
    filter(paraCombo == "dc_0.4_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1,strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0.4_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")


allSimInputOutput %>%
    filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0.2_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")


allSimInputOutput %>%
    filter(paraCombo == "dc_0_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color="black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")

allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_1_r_1") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text=element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")


allSimInputOutput %>%
    filter(paraCombo == "dc_0.2_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
    `colnames<-` (c("RelMeanTE", "MeanTransTime", "mRNAMarkdDecProp", "geneLength_codon", "RelativeDecRate")) %>%
    pivot_longer(names_to = "feature", values_to = "featureVals", !RelMeanTE) %>%
    ggplot(aes(x = featureVals, y = RelMeanTE)) +
    geom_point(size = 0.1) +
    facet_wrap(~feature, scales = "free_x", nrow = 1, strip.position = "bottom") +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "",
        y = "Relative mean TE",
        title = "dc_0.2_r_1") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")


allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MMDP, RMMDR) %>%
    ggplot(aes(x = MMDP, y = RMMDR)) +
    geom_point(size = 0.1) +
    labs(x = "MMDP",
        y = "Relative decay rates",
        title = "dc_1_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")

# MMDP = mRNAs marked for degradation proportion
allSimInputOutput %>%
    filter(paraCombo == "dc_0.2_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
    select(MMDP, RMMDR) %>%
    ggplot(aes(x = MMDP, y = RMMDR)) +
    geom_point(size = 0.1) +
    scale_x_log10() +
    scale_y_log10() +
    labs(x = "MMDP",
        y = "Relative decay rates",
        title = "dc_0.2_r_0") +
    geom_smooth(method = "lm") + 
    stat_cor(aes(label = paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.3, label.y.npc = 0.1, size = 3) + 
    theme_bw() +
    theme(text = element_text(size = 13),
        axis.text.x = element_text(size = rel(0.8)),
        strip.text = element_text(color = "black"),  # can't use element_blank() here because it gives error when p1+p2
        strip.background = element_blank(),  
        strip.placement = "outside")
```

Fig. S9
```{r fig.height = 7, fig.width = 10}
figureS9 <- allSimInputOutput %>%
  filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", dc != 0) %>%
  #select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
  ggplot(aes(x = MMDP, y = RMTE)) +
  geom_point(size = 0.1) +
  facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "Co-trns 20%"), r = c("0" = "Ribo prot indx  =  0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
  theme_bw() +
  theme(text = element_text(size = 13),
            legend.position = "none",
            plot.margin = margin(r = 0, unit = "pt"),
            panel.grid = element_blank()
    ) +
      labs(x = 'Proportions of mRNAs undergoing CMD for all genes',
           y = 'Relative mean translation efficiencies') +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
      scale_x_log10() +
      scale_y_log10()

figureS9
write_rds(figureS9, "../figures/figureS9.rds")

##############################################################

allSimInputOutput %>%
  filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", , r==0|r==1, dc==0.2|dc==1) %>%
  #select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
  ggplot(aes(x = MMDP, y = RMTE)) +
  geom_point(size = 0.1) +
  facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "Co-trns 20%"), r = c("0" = "Ribo prot indx  =  0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
  theme_bw() +
  theme(text = element_text(size = 13),
            legend.position = "none",
            plot.margin = margin(r = 0, unit = "pt"),
            panel.grid = element_blank()
    ) +
      labs(x = 'Proportions of mRNAs undergoing CMD for all genes',
           y = 'Relative mean translation efficiencies') +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
      scale_x_log10() +
      scale_y_log10()
```

Fig. S10
```{r fig.height = 7, fig.width = 10}
figureS10 <- allSimInputOutput %>%
  filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B") %>%
  #select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
  ggplot(aes(x = RMMDR, y = RMTE)) +
  geom_point(size = 0.1) +
  facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx  =  0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
  theme_bw() +
  theme(text = element_text(size = 13),
            legend.position = "none",
            plot.margin = margin(r = 0, unit = "pt"),
            panel.grid = element_blank()
    ) +
      labs(x = 'Relative mRNA decay rates',
           y = 'Relative mean translation efficiencies') +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
      scale_x_log10() +
      scale_y_log10()

figureS10
write_rds(figureS10, "../figures/figureS10.rds")
#########################################################

allSimInputOutput %>%
  filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", ORF != "YGR169C-A", ORF != "YLR106C", ORF != "YCR024C-B", r==0|r==1, dc==0|dc==1) %>%
  #select(RMTE, MTT, MMDP, geneLength_codon, RMMDR) %>%
  ggplot(aes(x = RMMDR, y = RMTE)) +
  geom_point(size = 0.1) +
  facet_grid(dc~r, labeller = labeller(dc = c("1" = "100%", "0.8" = "80%", "0.6" = "60%", "0.4" = "40%", "0.2" = "20%", "0" = "Co-trns 0%"), r = c("0" = "Ribo prot indx  =  0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"), label_parsed)) +
  theme_bw() +
  theme(text = element_text(size = 13),
            legend.position = "none",
            plot.margin = margin(r = 0, unit = "pt"),
            panel.grid = element_blank()
    ) +
      labs(x = 'Relative mRNA decay rates',
           y = 'Relative mean translation efficiencies') +
      geom_smooth(method = "lm") +
      stat_cor(aes(label = paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.2, label.y.npc = 0.4, size = 5) +
      scale_x_log10() +
      scale_y_log10()
```


was Fig. S9, maybe should not use it coz the vline calculated from its input decay rate may not be accurate.
```{r}
lifetimeDistri<- function(genevec){
    dfplot <- cbind(dc.r.df[c(2:5, 22:25), ], data.frame(matrix(NA, ncol = 5000, nrow = 8*3))) %>%
        mutate(ORF = c(rep(genevec[1], 8), rep(genevec[2], 8), rep(genevec[3], 8))) %>%
        relocate(ORF)
    
    for(i in 1:8){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[1], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
    for(i in 9:16){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[2], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
    for(i in 17:24){dfplot[i, 6:5005] = as.vector(h5read(simOutputH5, paste0(genevec[3], "/mRNA_lifeTimes/", dfplot$paraCombo[i])))}
    
    dfplot %>%
        pivot_longer(names_to = "varyingParaCombo", values_to = "lifeTimes", cols = 6:5005) %>%
        ggplot(aes(lifeTimes, fill = dc)) +
        geom_density(alpha = 0.5, color = NA) +
        facet_grid(factor(ORF, levels = genevec)~r, 
                   labeller = labeller(r = c("0" = "Ribo prot index 0", "0.1" = "0.1", "0.4" = "0.4", "1" = "1"))) +
        scale_x_log10(labels = scales::comma_format(accuracy = 1L)) +
        scale_fill_discrete(name = "CMD level",
                            labels = c("0" = "0", "0.2" = "20%", "0.6" = "60%", "1" = "100%")) +
        theme_bw() +
        labs(x = paste0("mRNA life time distribution (log10)")) +
        theme(
          legend.position = "top",
          legend.justification = "left",
          text = element_text(size = 13),
          axis.text.x = element_text(size = 8)) +
        geom_vline(data = filter(dfplot, ORF == genevec[1]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[1])]), linetype = "dashed", color = "dark grey") + #1049.856 =1/simInputFeatures$mRNADecRateNeymotin_sec[1] # 1049.856 is the input lifetime for YAL001C 
        geom_vline(data = filter(dfplot, ORF == genevec[2]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[2])]), linetype = "dashed", color = "dark grey") +
        geom_vline(data = filter(dfplot, ORF == genevec[3]), aes(xintercept = 1/simInputFeatures$mRNADecRateNeymotin_sec[which(simInputFeatures$ORF == genevec[3])]), linetype = "dashed", color = "dark grey") 
        # the above lines are the average life time calculated from input decay rates
}

lifetimeDistri(c("YAL001C", "YKR075C", "YBR011C"))
lifetimeDistri(c("YLR106C", "YKR054C", "YHR099W")) # longest genes
lifetimeDistri(c("YAR002C-A", "YBL050W", "YBR003W"))

```

```{r fig.height = 5, fig.width=12}
allSimInputOutput %>%
    filter(paraCombo == "dc_0_r_0", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>%  #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
    select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
    `colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
    pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
    ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
    geom_point(size=0.5) +
    facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
    theme_bw() +
    scale_y_log10() +
    theme(text = element_text(size = 13),
              legend.position = "none",
              strip.text = element_text(color="black", size=rel(1.2)),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank(),
              strip.background = element_blank(),  
              strip.placement = "outside"     #to put the strip labels below x-axis
      ) +
        labs(x = "",
             y = "Relative mean translation efficiency",
             title = "dc_0_r_0") +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
        scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))



allSimInputOutput %>%
    filter(paraCombo == "dc_0_r_1", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>%  #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
    select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
    `colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
    pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
    ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
    geom_point(size=0.5) +
    facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
    theme_bw() +
    scale_y_log10() +
    theme(text = element_text(size = 13),
              legend.position = "none",
              strip.text = element_text(color="black", size=rel(1.2)),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank(),
              strip.background = element_blank(),  
              strip.placement = "outside"     #to put the strip labels below x-axis
      ) +
        labs(x = "",
             y = "Relative mean translation efficiency",
             title = "dc_0_r_1") +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
        scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))



allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_1", mRNADecRateNeymotin_sec != 0, mRNAabundance>1, ORF!="YER053C-A", ORF!="YLR106C") %>%  #remove the gene with HL=450min, also an outlier gene "YLR106C" with RMTE==0.6
    select(ORF, paraCombo, RMTE, mRNAabundance_log10, iniProb_log10, mRNADecRateNeymotin_sec_log10, CAI, geneLength_codon_log10) %>%
    `colnames<-`(c("ORF", "paraCombo", "RMTE", "log(mRNAabundance)", "log(IniProb)", "log(DecRate)", "CAI", "log(Length)")) %>%
    pivot_longer(cols = -c(RMTE, paraCombo, ORF), names_to = "feature", values_to = "featureVal") %>%
    ggplot(aes(x=featureVal, y=RMTE, color=paraCombo)) +
    geom_point(size=0.5) +
    facet_wrap(~feature, scales = "free", nrow=1, strip.position = "bottom") +
    theme_bw() +
    scale_y_log10() +
    theme(text = element_text(size = 13),
              legend.position = "none",
              strip.text = element_text(color="black", size=rel(1.2)),  # can't use element_blank() here because it gives error when p1+p2
              plot.margin = margin(r = 0, unit = "pt"),
              panel.grid = element_blank(),
              strip.background = element_blank(),  
              strip.placement = "outside"     #to put the strip labels below x-axis
      ) +
        labs(x = "",
             y = "Relative mean translation efficiency",
             title = "dc_1_r_1") +
        geom_smooth(method="lm") +
        stat_cor(aes(label=paste(..r.label..,  sep = "~`,`~")), label.x.npc = 0.3, label.y.npc = 0.2, size=5) +
        scale_color_manual(name="", labels=c(""), values = c("dc_1_r_0" = "#1F78B4"))


```




```{r}
tmpdf <- data.frame(lifetime = log10(as.numeric(dfplot[1, 6:5005])))
which.max(density(tmpdf$lifetime)$y)
density(tmpdf$lifetime)$x[387]
ggplot(tmpdf, aes(lifetime)) + geom_density() + geom_vline(xintercept = density(tmpdf$lifetime)$x[387]) 


```


Fig. S

NOTES: 
Output decay rate = 1/mean lifetime <https://en.wikipedia.org/wiki/Particle_decay>

Total output decay rate = output decay rate * output mean mRNA count

Total input decay rate = input decay rate * mRNAabundance

Total synthesis rate = a scaled constant

(The above rates are all gene-specific)

Summary: changing total output decay rate is a result of changing co-translational decay and ribosome protection. In order to maintain the constant mRNA level, we have to scale the total synthesis rates to counter-effect the changing output decay rates.

When co-translational decay is higher than 0, there's always a surplus of mRNAs marked for decay, that are not accounted when calculating total decay probabilities (They're not accounted because they already have decay machinery bound to them, so cannot be accounted again into the mRNA pool that can still be degraded). Therefore the synthesis rates are scaled, in order to maintain a stable relative mRNA count (= mean output mRNA count/mRNAabundance) for it to be close to 1 (Supp Fig 1). The mean output mRNA count for each gene is a result of the balance between its scaled synthesis rate and total output decay rate. In other words, the total output decay rate directly respond to the scaled synthesis rate, rather than the input decay rate. 

The scaled total synthesis rates are the smallest when co-translational decay = 100%, so that the total real-time mRNA count can be close to mRNAabundance even with the highest amount of mRNAs marked for decay. In contrast, the scaled total synthesis rates are the largest and equal to the total input decay rates when co-trans decay = 0% (Supp Fig 2a), because there is 0 mRNA marked for decay. 

Hypothetically, the total output decay rates should equal to the total synthesis rates in order to maintain the real-time mRNA count to be largely the same at the beginning and the end of the simulation. If unequal, the real-time mRNA count should either go up or down as the simulation continues compared to the begining amount (i.e. mRNAabundance). However, our results show that the total output decay rates are slightly larger than the scaled synthesis rates across all the parameter combos (Supp Fig 2b. this is the part I don't understand, is it coz the total output decay rates include considering mRNAsMarkedForDecay, but the total scaled synthesis rates doesn't include mRNAsMarkedForDecay), and that's somehow contributing to the mean real-time mRNA count being equal to mRNAabundance as shown in Supp Fig 1. 

Because the output decay rates directly respond to total synthesis rates, they are influenced by the para combos in the same way that total synthesis rates are. That explains why Supp Fig 2c is similar to Supp Fig 2a in that the peaks skew to the right as co-translational decay ratio goes down. However in Supp Fig 2a, the ratio (scaled synthesis rates V.S. total input decay rates) skewed from less than 1 to 1; while in Supp Fig 2c, the ratio (total output decay rates V.S. total input decay rates) skewed from 1 to larger than 1. This would make sense if we can explain what's going on in Supp Fig 2b. 

Meanwhile, the output decay rates for short genes are much less affected by different co-translational decay proportions than long genes (Supp Fig 2d). This should be a reflection that the total synthesis rates for short genes are changing less with changing co-translational decay.

Supp Fig 2a: The scaled synthesis rates are the smallest when co-trans decay = 100%, while they\nare the largest and equal to the total input decay rates when co-trans decay = 0% 

Supp Fig 2b: Total output mRNA decay rates are slightly larger than scaled mRNA synthesis rates \n, but the ratio stays stable with changing parameters \n(I don't understand why the decay rates have to be larger)

Supp Fig 2c: Output decay rates respond to scaled synthesis rates, therefore its ratio against \ntotal input decay rates shows similar patter as scaled synthesis rates in Fig 2

Supp Fig 2d: Output decay rates for short genes are much less affected by different \nco-translational decay than long genes
```{r fig.height=6, fig.width=8}
allSimInputOutput_trial <- read_feather("../../../exp0/externalData/exp11_outcomeAll.feather")
tmp <- allSimInputOutput_trial %>% 
  filter(combo != "mRNAconstant", w != 0.01, w != 0.05, w != 0.2) %>% 
  select(NMMC, combo, ORF, r, w) %>% # NMMC in trial = RMMC in exp0, "normalized" VS "relative"
  mutate(dc=1-as.numeric(r)) %>%
  select(-r) %>% #delete the original column named "r", in trial data the r means CMD levels, and w means ribosome protection index
  dplyr::rename("r"="w", "paraCombo"="combo", "RMMCtrial"="NMMC") %>% # change the original col named "w" into "r", b/c "r" in exp0 means ribosome protection index
  mutate(paraCombo=paste0("dc_", dc, "_r_", r)) %>%
  select(-dc, -r)
  
    
sup1 <- (allSimInputOutput %>%
    filter(paraCombo != "mRNAconstant") %>%
    left_join(., tmp, by = c("paraCombo"="paraCombo", "ORF"="ORF"))) %>%
    select("paraCombo", "RMMC", "RMMCtrial", "dc", "r") %>%
    dplyr::rename("AfterScaling"="RMMC", "BeforeScaling"="RMMCtrial") %>%
    pivot_longer(names_to = "key", values_to = "RMMCvalue", cols = 2:3) %>%
    ggplot(aes(x=RMMCvalue, color=key)) +
        geom_density() +
        facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) + 
        labs(title = "Sup Fig 1: mRNA counts when varying are laregely equal to when they are constant \nafter scaling the mRNA synthesis rates", 
             x="Relative mean mRNA count") +
        scale_y_continuous() +
        geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
        theme_bw() +
        theme(legend.title = element_blank(),
              legend.position = "bottom",
              strip.text.x = element_text(size=10),
              strip.text.y = element_text(size=10)) # make the gridline color darker



############################################ plotting the (total syn rate after scaling)/(input decay rate*mRNAabundance) for all genes for all rw combos
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839))

for (i in 1:(nrow(dc.r.df)-1)) 
{
    inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
    outdf[, i] <- inf[, 3]/(inf[, 4]*inf[, 2])
}

colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]

sup2a <- outdf %>%
  pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
  left_join(., dc.r.df, by = "paraCombo") %>%
  filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
  ggplot(aes(x=value)) +
    geom_density() +
    facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
    geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
    labs(title = "",
         x="Scaled synthesis rates/Total input decay rates") +
    theme_bw() +
    theme(strip.text.x = element_text(size=9),
          strip.text.y = element_blank()) +
    scale_x_continuous(breaks = c(0.9, 1, 1.1, 1.3, 1.5))

############################################## plotting the (output decay rate)/(syn rate after scaling) for all genes for all dc/r paraCombos
mmdrAllgeneAlldcr <- read_feather("../calculatedMetrics/mmdrAllgeneAlldcr.feather")[, 2:nrow(dc.r.df)]
mmcAllgeneAlldcr<- read_feather("../calculatedMetrics/mmcAllgeneAlldcr.feather")[, 2:nrow(dc.r.df)]
totdr <- mmdrAllgeneAlldcr*mmcAllgeneAlldcr

totsynr <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839))
for (i in 1:(nrow(dc.r.df)-1))
{
    inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
    totsynr[, i] <- inf[, 3]
}

ratio.dr.synr <- totdr/totsynr
colnames(ratio.dr.synr) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]
ratio.dr.synr <- ratio.dr.synr[-1278, ]   # gene with the HL-min=490 min, the data point skews the scale

sup2b <- ratio.dr.synr %>%
  pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
  left_join(., dc.r.df, by = "paraCombo") %>%
  filter(paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>% 
  filter(!is.na(value)) %>%
  ggplot(aes(x=value)) +
    geom_density() +
    facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
    labs(title = "", 
         x="Total output decay rates/Scaled synthesis rates") +
    geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
    theme_bw() +
    theme(strip.text.x = element_text(size=9),
          strip.text.y = element_text(size=9),
          axis.title.y = element_blank()) 


############################################ plotting the (output decay rate*real time mRNA)/(input decay rate*mRNAabundance)for all genes for all rw combos
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates

for (i in 1:(nrow(dc.r.df)-1))  # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
    inf <- read.table(paste0("../../simulations/simInput/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec.tsv"))
    outdf[, i] <- (inf[, 4]*inf[, 2])
}

outdf <- totdr/outdf
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]

sup2c <- outdf[-1278, ] %>%       # gene with the HL-min=490 min, the data point skews the scales
  pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
  left_join(., dc.r.df, by = "paraCombo") %>%
  filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
  ggplot(aes(x=value)) +
    geom_density() +
    facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
    geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
    labs(title = "",
         x="Total output decay rates/Total input decay rates") +
    theme_bw() +
    theme(#strip.text.x = element_text(size=8),
          strip.text.y = element_blank(),
          strip.text.x = element_blank())  # hide the grid title


############################################
# sl = short or long
outdf$sl <- rep(NA,4839)   
outdf$sl[which(simInputFeatures$geneLength_codon>512)] <- "Long"
outdf$sl[which(simInputFeatures$geneLength_codon<=512)] <- "Short"


sup2d <- outdf[-1278, ] %>%       # took the gene with the HL-min=490 min, the data point skews the scales
  pivot_longer(names_to = "paraCombo", values_to = "value", cols = 1:(nrow(dc.r.df)-1)) %>%
  left_join(., dc.r.df, by = "paraCombo") %>%
  filter(value != 0, paraCombo == "dc_1_r_0"|paraCombo == "dc_0_r_0"|paraCombo == "dc_1_r_1"|paraCombo == "dc_0_r_1") %>%
  ggplot(aes(x=value, color=sl, group=sl)) +
    geom_density() +
    facet_grid(dc~r, labeller=labeller(dc=c("0"="0%", "0.2"="20%", "0.4"="40%", "0.6"="60%", "0.8"="80%", "1"="CMD 100%"), r=c("0"="Ribo prot indx = 0", "0.1"="0.1", "0.4"="0.4", "1"="1"), label_parsed)) +
    labs(title = "",
         x="Total output decay rates/Total input decay rates") +
    geom_vline(xintercept =1, linetype="dashed", color="dark grey") +
    theme_bw() +
    theme(
          strip.text.y = element_text(size=9),
          strip.text.x = element_blank(),
          legend.position = c(0.9, 0.95),
          axis.title.y = element_blank(),
          legend.background=element_blank(), # change the legend background to transparent
          legend.key.size = unit(0.5, "line")) +
    scale_color_discrete(name = "", labels = )
############################################
sup1

sup2 <- (sup2a|sup2b)/(sup2c|sup2d)
sup2 + plot_annotation(
   title = 'Supp Fig 2.',
  # subtitle = 'Supp Fig 2.',
  # caption = 'Hello',   # this one appears at the bottom
  tag_levels = 'a'
)




####################################
tot.in.dr <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates

for (i in 1:(nrow(dc.r.df)-1))  # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
    inf <- read.table(paste0(basefolder, expID, "/input/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec"))
    tot.in.dr[, i] <- (inf[, 4]*inf[, 2])
}

mmdrAllgeneAlldcr <- read_feather(paste0(basefolder, expID, "/analyses/featherFiles/mmdrAllgeneAlldcr.feather"))[, 2:nrow(dc.r.df)]
mmcAllgeneAlldcr<- read_feather(paste0(basefolder, expID, "/analyses/featherFiles/mmcAllgeneAlldcr.feather"))[, 2:nrow(dc.r.df)]
tot.out.dr <- mmdrAllgeneAlldcr*mmcAllgeneAlldcr

outdf <- tot.out.dr/tot.in.dr
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]

outdf[-1278, ] %>%       # gene with the HL-min=490 min, the data point skews the scales
  pivot_longer(names_to = "paraCombo", values_to = "outInDrRatio", cols = 1:(nrow(dc.r.df)-1)) %>%
  left_join(., dc.r.df, by = "paraCombo") %>%
  filter(outInDrRatio != 0) %>%
  mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
  ggplot(aes(x=dc_fct, y=outInDrRatio, fill=r)) +
  geom_boxplot(outlier.size = 0.1) +
  geom_hline(aes(yintercept=median(as.numeric(unlist(outdf %>%select(dc_1_r_0)))[-1278], na.rm = TRUE)), 
             color="red", linetype="dashed") +
  theme_bw() +
  labs(x="CMD level",
       y="Ratio between total output/input decay rates") +
  scale_x_discrete(labels=c("1"="100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0")) +
  scale_fill_discrete(name = "Ribosome\nprot index") +
  theme(
    text = element_text(size = 13),
    legend.position = "none"
  )


##############
outdf <- tibble(matrix(NA, ncol=nrow(dc.r.df)-1, nrow=4839)) #contains all the total input decay rates

for (i in 1:(nrow(dc.r.df)-1))  # these 16 columns are all the same, all equal to simInputFeatures$mRNAabundance*simInputFeatures$mRNADecRateNeymotin_sec
{
    inf <- read.table(paste0(basefolder, expID, "/input/allGenesDecrEqualsSynrWithScaling_", dc.r.df$paraCombo[i+1], "_S.cer.mRNA.ini.abndc.syn.dec"))
    outdf[, i] <- (inf[, 4]*inf[, 2])
}


outdf <- totdr/outdf
colnames(outdf) <- dc.r.df$paraCombo[2:nrow(dc.r.df)]


outdf %>%
  mutate(mRNAabundance=simInputFeatures$mRNAabundance, mRNADecRateNeymotin_sec=simInputFeatures$mRNADecRateNeymotin_sec, ORF=simInputFeatures$ORF) %>%
  pivot_longer(names_to = "paraCombo", values_to = "ratioVal", cols = !c(mRNAabundance, mRNADecRateNeymotin_sec, ORF)) %>%
  filter(paraCombo == "dc_0_r_1", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A") %>%
  ggplot(aes(x=mRNAabundance, y=ratioVal)) +
  geom_point() +
  theme_bw() +
  scale_x_log10()
  
```









Fig. S
```{r}
l %>%
  filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
  mutate(relativeFano = RMVPS/RMPSR) %>%
  ggplot(aes(x=RMPSR, y=relativeFano)) +
  geom_point(size=0.1) +
  scale_x_log10() +
  scale_y_log10() +
      labs(x= "Realtive mean protein synthesis rate",
        y = "Relative fano factor in protein synthesis rate",
        title = "") +
    geom_smooth(method="lm") + 
    stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) + 
    theme_bw() 



```


```{r}
allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
    ggplot(aes(x=MRD, y=RMVTE)) +
    geom_point(size=0.1) +
    scale_x_log10() +
    scale_y_log10() +
    labs(x= "Mean ribosome density",
        y = "Relative mean of variance in translation efficiency",
        title = "") +
    geom_smooth(method="lm") + 
    stat_cor(aes(label=paste(..r.label.., sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) + 
    theme_bw() 


allSimInputOutput %>%
    filter(paraCombo == "dc_1_r_0", mRNADecRateNeymotin_sec != 0, ORF != "YCR024C-B", mRNAabundance != 1) %>%
    ggplot(aes(x=MMDP, y=mRNADecRateNeymotin_sec)) +
    geom_point(size=0.1) +
    scale_x_log10() +
    scale_y_log10() +
    labs(x= "Mean ribosome density",
        y = "Relative mean of variance in translation efficiency",
        title = "") +
    geom_smooth(method="lm") + 
    stat_cor(aes(label=paste(..r.label..,  sep = "~`, `~")), label.x.npc = 0.1, label.y.npc = 0.3, size=3) + 
    theme_bw() 

```



Figure S.
```{r}

# calculating the mean number of free ribos (averaged over simuTime and techReps) for all dc.r.paraCombos
# RMFR = relative mean free ribo
mfr <- c() 
for(i in 1:nrow(dc.r.df)) # loop through the dc/r parameter space to calculate the mean free ribo
{
    # free_ribo averaged by simuTime and techReps
    mfr <- c(mfr, mean(h5read(simOutputH5, paste("free_ribo_tRNA_perMin", dc.r.df$paraCombo[i], "ribo", sep="/")), na.rm = TRUE))
    # set na.rm=T because in rep 66 again there's an NA at the last minute, which won't affect the overall mean
}

rmfr <- mfr/mfr[1]
rmfr_df <- data.frame(RMFR = rmfr,
                      MFR = mfr,
                      para = dc.r.df$para)

# rmfr_df can be found in exp0_prepPlots.Rmd
rmfr_df %>%
  left_join(., dc.r.df, by ="para") %>%
  filter(paraCombo != "mRNAconstant") %>%
  select(RMFR, dc, r) %>%
  spread(dc, RMFR) %>%
  select(-r) %>%
  colMeans() %>%
  tibble() %>% 
  mutate(dc=as.character(seq(0, 1, by=0.2))) %>%
  `colnames<-`(c("RMFRmeanByCoTrans", "dc")) %>%
    mutate(cotrans = paste0(as.numeric(dc)*100, "%")) %>%
    ggplot(aes(x=cotrans, y=RMFRmeanByCoTrans)) +
    geom_point() +
    theme_bw() +
    labs ( title = "",
                x ="Co-translational decay proportion",
                y = "Mean free ribosomes (relative to mRNA constant)") +
    theme(text = element_text(size = 13),
          panel.grid = element_blank()) +
    scale_x_discrete(limits = c("100%", "80%", "60%", "40%", "20%", "0%"))
  
```

```{r}

make_heatmap <- function(orderVar, outputVar, legendName, titleY)
{
    colorvec <- quantile(allSimInputOutput[[outputVar]])
  
    tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", orderVar)]
    tmp <- tmp[order(tmp[, 2], decreasing = T), ]
    tmp$newid_dc1r0 <- 1:4839
    
    allSimInputOutput %>% 
        filter(paraCombo != "mRNAconstant") %>% 
        left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
        mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
        ggplot(aes_string(x = "r", 
                   y = "factor(newid_dc1r0)",
                   fill = outputVar)) +
        geom_raster() +
        theme_bw() +
        scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"),   # blue white red
                        values = scales::rescale(colorvec), name=legendName) +
        facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0"))) + 
        labs ( x = "Ribosome protection index r",
               y = titleY,
               title = "") +
        theme(text = element_text(size = 18),
              axis.text.y = element_blank(),
              axis.ticks.y = element_blank(),
              panel.border = element_blank(),  # remove the grid lines in facet_grid
              panel.spacing=unit(0, "lines")) +   # reset the spacing between facets
         guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
         scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim

}


```

```{r fig.height=8}
# 1st var= the variable column the sorting is based on
# 2nd var= the variable column presented in the heatmap
# 3rd var= the legend text
# 4th var= y-axis title

make_heatmap("RMTE", "RMTE", "Relative\nmean translation\nefficiency", "Genes ranked by the first column")
make_heatmap("RMVTE", "RMVTE", "Relative mean\nof the variance\nin translation\nefficiency", "Genes ranked by the first column")

########################################################## add a plot for mRNAs marked for decay
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$MMDP)

tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839

allSimInputOutput %>% 
    mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
    filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", dc != 0) %>% 
    left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
    ggplot(aes(x = r, 
               y = factor(newid_dc1r0),
               #y = as.character(newid_geneLength_codon),   # genes are sorted by geneLength_codon within each group
               fill = MMDP)) +
    geom_raster() +
    theme_bw() +
    scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"),   # blue white red
                    values = scales::rescale(colorvec), name="mRNAs marked\nfor decay ratio") +
    facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0%"))) +
    labs ( x = "Ribosome protection index w",
           y = "Genes ranked by the first column in translation efficiency plot",
           title = "") +
    theme(text = element_text(size = 18),
          plot.title = element_text(size=rel(1.5)),
          axis.text.y = element_blank(),
          axis.ticks.y = element_blank(),
          panel.border = element_blank(),  # remove the grid lines in facet_grid
          panel.spacing=unit(0, "lines")) +   # reset the spacing between facets
     guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
     scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim


########################################################## add another plot for mRNAs marked for decay
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$MMDP)

tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMVTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839

allSimInputOutput %>% 
    mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
    filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A", dc != 0) %>% 
    left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
    ggplot(aes(x = r, 
               y = factor(newid_dc1r0),
               fill = MMDP)) +
    geom_raster() +
    theme_bw() +
    scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"),   # blue white red
                    values = scales::rescale(colorvec), name="mRNAs marked\nfor decay ratio") +
    facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0%"))) +
    labs ( x = "Ribosome protection index w",
           y = "Genes ranked by the first column in translation efficiency plot",
           title = "") +
    theme(text = element_text(size = 18),
          plot.title = element_text(size=rel(1.5)),
          axis.text.y = element_blank(),
          axis.ticks.y = element_blank(),
          panel.border = element_blank(),  # remove the grid lines in facet_grid
          panel.spacing=unit(0, "lines")) +   # reset the spacing between facets
     guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
     scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim

```


```{r fig.height=8}
# 1st var= the variable column the sorting is based on
# 2nd var= the variable column presented in the heatmap
# 3rd var= the legend text
# 4th var= y-axis title

make_heatmap("RMPSR", "RMPSR", "Relative\nmean protein\nsyn rate", "Genes ranked by the first column")
make_heatmap("RMVPS", "RMVPS", "Relative\nmean of variance in\nprotein syn rate", "Genes ranked by the first column")

make_heatmap_tmp <- function(orderVar, outputVar, legendName, titleY)
{
    colorvec <- quantile(allSimInputOutput[[outputVar]])
  
    tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", orderVar)]
    tmp <- tmp[order(tmp[, 2], decreasing = T), ]
    tmp$newid_dc1r0 <- 1:4839
    
    allSimInputOutput %>% 
        filter(paraCombo != "mRNAconstant", RMVTBR != Inf) %>% 
        left_join(.,tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
        mutate(dc_fct=factor(dc, levels=c("1", "0.8", "0.6", "0.4", "0.2", "0"))) %>%
        ggplot(aes_string(x = "r", 
                   y = "factor(newid_dc1r0)",
                   fill = outputVar)) +
        geom_raster() +
        theme_bw() +
        scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"),   # blue white red
                        values = scales::rescale(colorvec), name=legendName) +
        facet_wrap(~dc_fct, nrow=1, labeller=labeller(dc_fct=c("1"="Co-trans 100%", "0.8"="80%", "0.6"="60%", "0.4"="40%", "0.2"="20%", "0"="0"))) + 
        labs ( x = "Ribosome protection index r",
               y = titleY,
               title = "") +
        theme(text = element_text(size = 18),
              axis.text.y = element_blank(),
              axis.ticks.y = element_blank(),
              panel.border = element_blank(),  # remove the grid lines in facet_grid
              panel.spacing=unit(0, "lines")) +   # reset the spacing between facets
         guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
         scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim

}
make_heatmap_tmp("RMTE", "RMVTBR", "Relative\nvariance in total\nbound ribosomes", "Genes ranked by the first column in relative TE")


make_heatmap("MML", "MML", "Mean of mRNA\nlife-times", "Genes ranked by the first column")

###############################################################
colorvec <- quantile((allSimInputOutput%>% filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A"))$RMRD)

tmp <- (allSimInputOutput%>%filter(paraCombo == "dc_1_r_0"))[, c("ORF", "RMTE")]
tmp <- tmp[order(tmp[, 2], decreasing = T), ]
tmp$newid_dc1r0 <- 1:4839


allSimInputOutput %>% 
    filter(paraCombo != "mRNAconstant", mRNADecRateNeymotin_sec != 0, ORF != "YER053C-A") %>% 
    left_join(., tmp[, c("ORF", "newid_dc1r0")], by = "ORF") %>%
    ggplot(aes(x = r, 
               y = factor(newid_dc1r0),
               fill = RMRD)) +
    geom_raster() +
    theme_bw() +
    scale_fill_gradientn(colours = c("#377eb8", "white", "#e41a1c"),   # blue white red
                    values = scales::rescale(colorvec), name="Relative mean\nribo density") +
    facet_wrap(~dc, nrow=1, labeller=labeller(dc=c("1"="Co-trans 100%", "0.8"="0.8", "0.6"="0.6", "0.4"="0.4", "0.2"="0.2", "0"="0"))) +
    labs ( x = "Ribosome protection index",
           y = "Genes ranked by the first column for translation efficiency",
           title = "") +
    theme(text = element_text(size = 18),
          plot.title = element_text(size=rel(1.5)),
          axis.text.y = element_blank(),
          axis.ticks.y = element_blank(),
          panel.border = element_blank(),  # remove the grid lines in facet_grid
          panel.spacing=unit(0, "lines")) +   # reset the spacing between facets
     guides(fill = guide_colourbar(barwidth = 1, barheight = 10)) +
     scale_x_discrete(expand = c(0, 0)) # remove the extra space beyond xlim
```
